diff --git a/.ipynb_checkpoints/model.safetensors.index-checkpoint.json b/.ipynb_checkpoints/model.safetensors.index-checkpoint.json new file mode 100644 index 0000000000000000000000000000000000000000..21bd4e588fca6f050f6edcdd47a6fc961142c720 --- /dev/null +++ b/.ipynb_checkpoints/model.safetensors.index-checkpoint.json @@ -0,0 +1,80451 @@ +{ + "metadata": {}, + "weight_map": { + "model.embed_tokens.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.0.mlp.down_proj.weight_scale_inv": 
"model-00001-of-000163.safetensors", + "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.1.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_proj.weight": 
"model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.2.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", + 
"model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.shared_experts.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight": 
"model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.0.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.1.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.2.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.3.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.4.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.5.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.6.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.7.down_proj.weight_scale_inv": 
"model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.8.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.9.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.10.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.11.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.11.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.12.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.13.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.14.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.15.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.16.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.17.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.18.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.18.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.19.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.20.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.21.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.22.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.23.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.24.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.25.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.25.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.26.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.27.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.28.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + 
"model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.29.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.30.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", + "model.layers.3.mlp.experts.31.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.31.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.32.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.32.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.33.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.34.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.35.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.36.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.37.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.38.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.39.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.39.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.40.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.41.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.42.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.43.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.44.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.45.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.46.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.46.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.47.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.48.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.49.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.50.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.51.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.52.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.53.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.53.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.54.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.55.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.56.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.57.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.58.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.59.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.60.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.60.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.61.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.62.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.63.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.64.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.65.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.66.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.67.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.67.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.68.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.69.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.70.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.71.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.72.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.73.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.74.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.74.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.75.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.76.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.77.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.78.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.79.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.80.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.81.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.81.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.82.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.83.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.84.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.85.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.86.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.87.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.88.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.88.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.89.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.90.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.91.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.92.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.93.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.94.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.95.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.95.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.96.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.97.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.98.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.99.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.100.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.101.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.102.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.102.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.103.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.104.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.105.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.106.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.107.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.108.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.109.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.109.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.110.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.111.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.112.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.113.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.114.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.115.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.116.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.116.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.117.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.118.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.119.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.120.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.121.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.122.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.123.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.123.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.124.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.125.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.126.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + 
"model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.127.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.128.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", + "model.layers.3.mlp.experts.129.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.129.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.130.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.130.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.131.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.132.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.133.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.134.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.135.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.136.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.137.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.137.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.138.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.139.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.140.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.141.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.142.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.143.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.144.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.144.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.145.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.146.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.147.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.148.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.149.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.150.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.151.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.151.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.152.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.153.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.154.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.155.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.156.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.157.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.158.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.158.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.159.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.160.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.161.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.162.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.163.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.164.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.165.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.165.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.166.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.167.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.168.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.169.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.170.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.171.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.172.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.172.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.173.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.174.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.175.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.176.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.177.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.178.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.179.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.179.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.180.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.181.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.182.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.183.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.184.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.185.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.186.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.186.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.187.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.188.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.189.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.190.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.191.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.192.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.193.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.193.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.194.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.195.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.196.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.197.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.198.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.199.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.200.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.200.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.201.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.202.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.203.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.204.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.205.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.206.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.207.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.207.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.208.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.209.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.210.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.211.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.212.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.213.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.214.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.214.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.215.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.216.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.217.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.218.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.219.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.220.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.221.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.221.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.222.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.223.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.224.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + 
"model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.225.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", + "model.layers.3.mlp.experts.226.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.227.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.228.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.228.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.229.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.230.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.231.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.232.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.233.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.234.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.235.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.235.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.236.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.237.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.238.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.239.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.240.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.241.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.242.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.242.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.243.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.244.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.245.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.246.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.247.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.248.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.249.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.249.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.250.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.251.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.252.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.253.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.254.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.3.mlp.experts.255.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.self_attn.q_a_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.q_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.kv_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.self_attn.o_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.shared_experts.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight": 
"model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.0.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.1.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.2.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.3.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.4.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.5.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.6.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.up_proj.weight_scale_inv": 
"model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.7.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.8.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.9.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.10.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.11.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.11.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.12.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.13.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.14.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.15.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.16.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.17.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.18.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.18.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.19.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.20.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.21.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.22.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.23.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.24.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.25.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.25.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.26.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.27.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.28.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.29.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.30.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.31.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.32.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.32.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.33.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.34.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.35.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.36.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.37.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.38.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.39.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.39.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.40.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.41.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.42.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.43.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.44.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.45.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.46.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.46.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.47.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.48.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.49.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.50.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.51.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.52.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.53.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.53.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.54.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.55.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.56.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.57.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.58.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.59.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", + 
"model.layers.4.mlp.experts.60.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.60.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.61.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.62.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", + "model.layers.4.mlp.experts.63.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.63.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.64.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.65.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.66.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.67.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.67.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.68.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.69.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.70.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.71.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.72.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.73.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.74.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.74.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.75.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.76.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.77.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.78.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.79.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.80.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.81.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.81.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.82.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.83.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.84.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.85.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.86.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.87.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.88.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.88.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.89.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.90.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.91.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.92.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.93.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.94.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.95.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.95.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.96.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.97.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.98.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.99.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.100.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.101.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.102.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.102.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.103.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.104.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.105.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.106.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.107.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.108.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.109.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.109.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.110.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.111.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.112.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.113.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.114.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.115.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.116.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.116.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.117.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.118.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.119.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.120.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.121.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.122.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.123.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.123.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.124.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.125.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.126.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.127.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.128.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.129.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.130.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.130.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.131.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.132.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.133.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.134.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.135.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.136.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.137.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.137.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.138.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.139.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.140.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.141.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.142.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.143.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.144.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.144.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.145.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.146.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.147.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.148.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.149.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.150.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.151.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.151.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.152.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.153.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.154.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.155.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.156.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.157.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", + 
"model.layers.4.mlp.experts.158.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.158.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.159.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", + "model.layers.4.mlp.experts.160.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.161.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.162.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.163.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.164.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.165.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.165.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.166.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.167.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.168.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.169.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.170.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.171.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.172.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.172.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.173.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.174.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.175.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.176.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.177.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.178.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.179.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.179.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.180.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.181.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.182.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.183.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.184.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.185.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.186.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.186.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.187.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.188.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.189.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.190.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.191.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.192.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.193.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.193.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.194.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.195.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.196.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.197.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.198.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.199.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.200.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.200.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.201.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.202.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.203.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.204.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.205.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.206.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.207.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.207.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.208.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.209.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.210.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.211.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.212.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.213.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.214.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.214.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.215.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.216.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.217.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.218.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.219.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.220.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.221.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.221.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.222.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.223.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.224.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.225.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.226.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.227.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.228.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.228.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.229.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.230.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.231.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.232.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.233.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.234.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.235.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.235.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.236.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.237.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.238.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.239.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.240.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.241.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.242.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.242.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.243.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.244.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.245.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.246.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.247.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.248.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.249.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.249.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.250.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.251.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + 
"model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.252.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.253.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.254.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.4.mlp.experts.255.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", + 
"model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.q_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.kv_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", + "model.layers.5.self_attn.o_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.shared_experts.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.0.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.0.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.1.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.2.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight": 
"model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.3.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.4.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.5.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.6.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.7.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.8.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.9.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.11.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.12.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.13.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.14.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.14.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.15.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.16.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.17.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.18.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.19.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.20.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.21.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.21.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.22.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.23.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.24.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.25.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.26.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.27.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.28.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.28.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.29.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.30.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.31.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.32.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.33.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.34.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.35.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.35.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.36.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.37.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.38.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.39.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.40.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.41.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.42.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.42.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.43.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.44.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.45.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.46.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.47.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.48.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.49.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.49.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.50.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.51.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.52.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.53.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.54.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.55.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.56.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.56.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.57.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.58.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.59.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.60.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.61.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.62.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.63.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.63.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.64.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.65.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.66.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.67.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.68.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.69.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.70.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.70.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.71.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.72.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.73.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.74.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.75.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.76.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.77.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.77.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.78.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.79.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.80.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.81.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.82.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.83.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.84.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.84.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.85.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.86.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.87.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.88.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.89.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.90.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.91.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.91.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.92.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.93.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.94.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + 
"model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.95.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", + "model.layers.5.mlp.experts.96.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.96.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.97.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.98.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.98.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.99.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.100.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.101.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.102.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.103.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.104.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.105.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.105.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.106.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.107.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.108.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.109.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.110.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.111.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.112.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.112.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.113.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.114.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.115.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.116.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.117.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.118.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.119.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.119.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.120.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.121.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.122.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.123.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.124.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.125.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.126.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.126.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.127.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.128.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.129.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.130.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.131.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.132.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.133.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.133.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.134.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.135.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.136.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.137.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.138.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.139.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.140.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.140.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.141.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.142.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.143.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.144.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.145.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.146.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.147.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.147.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.148.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.149.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.150.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.151.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.152.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.153.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.154.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.154.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.155.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.156.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.157.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.158.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.159.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.160.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.161.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.161.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.162.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.163.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.164.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.165.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.166.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.167.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.168.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.168.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.169.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.170.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.171.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.172.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.173.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.174.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.175.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.175.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.176.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.177.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.178.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.179.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.180.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.181.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.182.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.182.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.183.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.184.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.185.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.186.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.187.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.188.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.189.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.189.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.190.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.191.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.192.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + 
"model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.193.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", + "model.layers.5.mlp.experts.194.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.194.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.195.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.196.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.196.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.197.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.198.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.199.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.200.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.201.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.202.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.203.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.203.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.204.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.205.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.206.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.207.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.208.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.209.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.210.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.210.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.211.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.212.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.213.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.214.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.215.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.216.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.217.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.217.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.218.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.219.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.220.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.221.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.222.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.223.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.224.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.224.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.225.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.226.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.227.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.228.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.229.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.230.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.231.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.231.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.232.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.233.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.234.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.235.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.236.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.237.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.238.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.238.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.239.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.240.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.241.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.242.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.243.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.244.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.245.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.245.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.246.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.247.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.248.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.249.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.250.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.251.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.5.mlp.experts.252.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.252.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.253.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.254.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.5.mlp.experts.255.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.q_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.kv_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.self_attn.o_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.shared_experts.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.0.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.1.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.2.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.3.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.4.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.5.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.6.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.7.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.7.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.8.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.9.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight": 
"model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.10.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.11.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.12.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.13.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.14.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.15.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.16.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.17.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.18.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.19.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.20.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.21.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.22.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.23.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.24.down_proj.weight": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.24.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.25.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.26.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.27.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + 
"model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.28.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.29.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", + "model.layers.6.mlp.experts.30.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.30.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.31.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.32.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.33.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.34.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.35.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.36.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.37.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.38.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.39.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.40.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.41.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.42.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.43.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.44.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.45.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.46.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.47.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.48.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.49.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.50.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.51.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.52.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.53.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.54.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.55.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.56.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.57.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.58.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.59.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.60.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.61.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.62.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.63.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.64.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.65.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.66.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.67.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.68.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.69.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.70.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.71.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.72.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.73.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.74.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.75.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.76.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.77.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.78.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.79.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.80.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.81.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.82.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.83.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.84.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.85.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.86.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.87.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.88.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.89.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.90.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.91.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.92.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.93.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.94.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.95.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.96.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.97.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.98.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.99.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.100.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.101.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.102.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.103.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.104.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.105.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.106.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.107.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.108.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.109.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.110.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.111.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.112.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.113.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.114.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.115.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.116.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.117.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.118.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.119.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.120.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.121.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.122.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.123.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.124.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.125.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + 
"model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.126.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.127.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", + "model.layers.6.mlp.experts.128.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.128.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.129.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.130.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.131.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.132.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.133.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.134.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.135.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.136.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.137.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.138.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.139.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.140.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.141.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.142.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.143.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.144.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.145.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.146.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.147.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.148.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.149.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.150.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.151.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.152.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.153.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.154.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.155.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.156.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.157.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.158.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.159.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.160.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.161.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.162.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.163.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.164.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.165.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.166.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.167.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.168.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.169.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.170.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.171.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.172.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.173.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.174.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.175.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.176.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.177.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.178.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.179.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.180.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.181.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.182.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.183.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.184.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.185.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.186.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.187.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.188.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.189.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.190.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.191.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.192.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.193.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.194.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.195.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.196.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.197.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.198.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.199.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.200.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.201.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.202.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.203.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.204.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.205.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.206.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.207.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.208.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.209.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.210.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.211.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.212.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.213.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.214.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.215.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.216.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.217.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.218.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.219.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.220.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.221.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.222.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.223.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + 
"model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.224.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", + "model.layers.6.mlp.experts.225.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.226.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.227.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.228.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.229.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.230.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.231.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.232.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.233.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.234.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.235.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.236.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.237.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.238.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.239.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.240.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.241.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.242.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.243.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.244.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.245.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.246.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.247.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.248.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.249.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.250.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.251.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.252.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.253.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.254.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", + 
"model.layers.6.mlp.experts.255.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", + "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", + "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_a_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.q_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.kv_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.self_attn.o_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.shared_experts.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.0.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.1.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.2.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight": 
"model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.3.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.4.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.5.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.6.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.7.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.8.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.9.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.10.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.11.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.12.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.13.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.14.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.14.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.15.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.16.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.17.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.18.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.19.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.20.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.21.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.21.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.22.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.23.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.24.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.25.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.26.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.27.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.28.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.28.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.29.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.30.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.31.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.32.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.33.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.34.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.35.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.35.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.36.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.37.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.38.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.39.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.40.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.41.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.42.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.42.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.43.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.44.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.45.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.46.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.47.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.48.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.49.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.49.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.50.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.51.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.52.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.53.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.54.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.55.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.56.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.56.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.57.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.58.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.59.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.60.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.61.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.62.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.63.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.63.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.64.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.65.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.66.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.67.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.68.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.69.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.70.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.70.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.71.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.72.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.73.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.74.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.75.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.76.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.77.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.77.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.78.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.79.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.80.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.81.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.82.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.83.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.84.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.84.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.85.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.86.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.87.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.88.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.89.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.90.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", + 
"model.layers.7.mlp.experts.91.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.91.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", + "model.layers.7.mlp.experts.92.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.92.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.93.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.94.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.95.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.96.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.97.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.98.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.98.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.99.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.100.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.101.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.102.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.103.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.104.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.105.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.105.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.106.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.107.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.108.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.109.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.110.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.111.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.112.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.112.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.113.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.114.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.115.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.116.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.117.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.118.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.119.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.119.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.120.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.121.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.122.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.123.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.124.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.125.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.126.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.126.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.127.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.128.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.129.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.130.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.131.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.132.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.133.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.133.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.134.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.135.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.136.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.137.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.138.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.139.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.140.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.140.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.141.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.142.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.143.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.144.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.145.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.146.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.147.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.147.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.148.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.149.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.150.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.151.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.152.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.153.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.154.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.154.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.155.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.156.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.157.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.158.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.159.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.160.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.161.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.161.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.162.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.163.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.164.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.165.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.166.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.167.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.168.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.168.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.169.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.170.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.171.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.172.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.173.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.174.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.175.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.175.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.176.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.177.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.178.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.179.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.180.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.181.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.182.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.182.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.183.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.184.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.185.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.186.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.187.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.188.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", + 
"model.layers.7.mlp.experts.189.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", + "model.layers.7.mlp.experts.189.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.190.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.191.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.192.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.193.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.194.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.195.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.196.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.196.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.197.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.198.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.199.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.200.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.201.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.202.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.203.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.203.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.204.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.205.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.206.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.207.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.208.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.209.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.210.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.210.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.211.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.212.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.213.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.214.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.215.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.216.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.217.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.217.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.218.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.219.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.220.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.221.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.222.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.223.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.224.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.224.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.225.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.226.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.227.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.228.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.229.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.230.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.231.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.231.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.232.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.233.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.234.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.235.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.236.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.237.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.238.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.238.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.239.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.240.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.241.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.242.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.243.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.244.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.245.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.245.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.246.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.247.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.248.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.249.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.250.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.251.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.252.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.252.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.253.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.254.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.7.mlp.experts.255.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.q_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.kv_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.self_attn.o_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.shared_experts.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.0.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.1.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.2.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.3.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.3.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.4.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.5.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight": 
"model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.6.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.7.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.8.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.9.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.10.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.11.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.12.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.13.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.14.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.15.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.16.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.17.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.18.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.19.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.20.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.21.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.22.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.23.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + 
"model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.24.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.25.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", + "model.layers.8.mlp.experts.26.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.26.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.27.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.28.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.29.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.30.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.31.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.32.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.33.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.34.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.35.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.36.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.37.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.38.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.39.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.40.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.41.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.42.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.43.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.44.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.45.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.46.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.47.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.48.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.49.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.50.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.51.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.52.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.53.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.54.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.55.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.56.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.57.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.58.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.59.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.60.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.61.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.62.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.63.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.64.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.65.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.66.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.67.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.68.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.69.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.70.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.71.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.72.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.73.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.74.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.75.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.76.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.77.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.78.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.79.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.80.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.81.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.82.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.83.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.84.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.85.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.86.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.87.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.88.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.89.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.90.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.91.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.92.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.93.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.94.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.95.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.96.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.97.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.98.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.99.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.100.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.101.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.102.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.103.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.104.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.105.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.106.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.107.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.108.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.109.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.110.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.111.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.112.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.113.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.114.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.115.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.116.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.117.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.118.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.119.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.120.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.121.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + 
"model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.122.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", + "model.layers.8.mlp.experts.123.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.124.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.125.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.126.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.127.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.128.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.129.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.130.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.131.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.132.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.133.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.134.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.135.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.136.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.137.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.138.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.139.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.140.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.141.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.142.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.143.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.144.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.145.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.146.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.147.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.148.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.149.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.150.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.151.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.152.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.153.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.154.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.155.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.156.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.157.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.158.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.159.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.160.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.161.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.162.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.163.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.164.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.165.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.166.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.167.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.168.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.169.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.170.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.171.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.172.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.173.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.174.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.175.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.176.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.177.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.178.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.179.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.180.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.181.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.182.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.183.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.184.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.185.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.186.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.187.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.188.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.189.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.190.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.191.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.192.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.193.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.194.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.195.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.196.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.197.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.198.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.199.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.200.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.201.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.202.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.203.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.204.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.205.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.206.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.207.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.208.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.209.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.210.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.211.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.212.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.213.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.214.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.215.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.216.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.217.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.218.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.219.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + 
"model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.220.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", + "model.layers.8.mlp.experts.221.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.221.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.222.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.223.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.224.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.225.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.226.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.227.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.228.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.229.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.230.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.231.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.232.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.233.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.234.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.235.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.236.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.237.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.238.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.239.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.240.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.241.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.242.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.243.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.244.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.245.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.246.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.247.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.248.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.249.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.250.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.251.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.252.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.253.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.254.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.8.mlp.experts.255.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.q_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.kv_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.self_attn.o_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.shared_experts.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.0.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.1.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.2.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.3.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.4.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.5.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight": 
"model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.6.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.7.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.8.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.9.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.10.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.11.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.12.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.13.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.13.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.14.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.15.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.16.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.17.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.18.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.19.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.20.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.20.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.21.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.22.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.23.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.24.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.25.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.26.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.27.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.27.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.28.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.29.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.30.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.31.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.32.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.33.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.34.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.34.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.35.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.36.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.37.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.38.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.39.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.40.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.41.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.41.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.42.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.43.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.44.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.45.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.46.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.47.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.48.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.48.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.49.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.50.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.51.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.52.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.52.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.53.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.54.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", + 
"model.layers.9.mlp.experts.55.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.55.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.56.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", + "model.layers.9.mlp.experts.57.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.58.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.59.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.60.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.61.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.62.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.62.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.63.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.64.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.65.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.66.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.67.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.68.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.69.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.69.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.70.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.71.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.72.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.73.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.74.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.75.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.76.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.76.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.77.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.78.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.79.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.80.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.81.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.82.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.83.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.83.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.84.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.85.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.86.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.87.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.88.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.89.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.90.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.90.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.91.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.92.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.93.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.94.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.95.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.96.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.97.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.97.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.98.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.99.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.100.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.101.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.102.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.103.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.104.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.104.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.105.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.106.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.107.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.108.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.109.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.110.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.111.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.111.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.112.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.113.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.114.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.115.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.116.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.117.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.118.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.118.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.119.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.120.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.121.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.122.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.123.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.124.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.125.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.125.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.126.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.127.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.128.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.129.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.130.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.131.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.132.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.132.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.133.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.134.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.135.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.136.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.137.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.138.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.139.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.139.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.140.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.141.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.142.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.143.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.144.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.145.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.146.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.146.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.147.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.148.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.149.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.150.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.151.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.152.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", + 
"model.layers.9.mlp.experts.153.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.153.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.154.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", + "model.layers.9.mlp.experts.155.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.155.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.156.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.157.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.158.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.159.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.160.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.160.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.161.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.162.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.163.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.164.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.165.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.166.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.167.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.167.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.168.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.169.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.170.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.171.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.172.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.173.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.174.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.174.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.175.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.176.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.177.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.178.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.179.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.180.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.181.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.181.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.182.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.183.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.184.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.185.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.186.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.187.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.188.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.188.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.189.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.190.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.191.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.192.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.193.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.194.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.195.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.195.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.196.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.197.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.198.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.199.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.200.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.201.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.202.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.202.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.203.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.204.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.205.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.206.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.207.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.208.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.209.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.209.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.210.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.211.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.212.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.213.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.214.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.215.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.216.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.216.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.217.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.218.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.219.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.220.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.221.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.222.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.223.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.223.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.224.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.225.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.226.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.227.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.228.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.229.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.230.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.230.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.231.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.232.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.233.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.234.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.235.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.236.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.237.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.237.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.238.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.239.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.240.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.241.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.242.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.243.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.244.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.244.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.245.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.246.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.247.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.248.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.249.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.250.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", + 
"model.layers.9.mlp.experts.251.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.251.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.252.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", + "model.layers.9.mlp.experts.253.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.253.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.254.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.9.mlp.experts.255.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.9.post_attention_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.q_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.kv_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.self_attn.o_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.shared_experts.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.0.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.1.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.2.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.2.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.3.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.4.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.5.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.6.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.7.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.8.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.9.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.9.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.10.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.11.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.12.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.13.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.14.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.15.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.16.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.16.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.17.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.18.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.19.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.20.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.21.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.22.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.23.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.23.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.24.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.25.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.26.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.27.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.28.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.29.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.30.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.30.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.31.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.32.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.33.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.34.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.35.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.36.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.37.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.37.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.38.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.39.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.40.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.41.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.42.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.43.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.44.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.44.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.45.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.46.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.47.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.48.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.49.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.50.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.51.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.51.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.52.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.53.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.54.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.55.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.56.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.57.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.58.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.58.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.59.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.60.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.61.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.62.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.63.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.64.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.65.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.65.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.66.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.67.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.68.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.69.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.70.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.71.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.72.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.72.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.73.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.74.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.75.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.76.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.77.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.78.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.79.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.79.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.80.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.81.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.82.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.83.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.84.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.85.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", + 
"model.layers.10.mlp.experts.86.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.86.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.87.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.88.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", + "model.layers.10.mlp.experts.89.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.89.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.90.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.91.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.92.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.93.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.93.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.94.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.95.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.96.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.97.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.98.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.99.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.100.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.100.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.101.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.102.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.103.down_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.104.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.105.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.106.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.107.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.108.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.109.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.110.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.111.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.112.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.113.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.gate_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.114.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.115.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.116.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.117.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.118.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.119.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.120.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.121.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.121.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.122.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.123.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.up_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.124.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.125.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.126.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.127.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.128.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.129.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.130.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.131.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.131.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.132.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.133.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.134.down_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.135.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.136.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.137.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.138.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.139.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.140.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.141.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.142.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.143.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.144.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.gate_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.145.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.146.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.147.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.148.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.149.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.150.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.151.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.152.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.152.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.153.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.154.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.up_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.155.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.156.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.157.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.158.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.159.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.160.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.161.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.162.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.162.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.163.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.164.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.165.down_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.166.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.167.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.168.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.up_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.169.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.170.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.171.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.172.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.173.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.174.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.175.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.gate_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.176.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.177.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.178.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.down_proj.weight": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.179.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.180.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.181.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.182.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", + 
"model.layers.10.mlp.experts.183.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.183.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.184.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.185.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.up_proj.weight_scale_inv": 
"model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.186.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", + "model.layers.10.mlp.experts.187.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.187.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.188.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.189.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.gate_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.190.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.191.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.192.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.193.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.193.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.194.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.195.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.196.down_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.197.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.198.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.199.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.up_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.200.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.201.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.202.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.203.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.204.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.205.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.206.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.gate_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.207.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.208.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.209.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.down_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.210.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.211.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.212.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.213.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.214.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.214.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.215.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.216.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.up_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.217.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.218.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.219.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.220.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.gate_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.221.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.222.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.223.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.224.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.224.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.225.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.226.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.227.down_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.228.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.229.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.230.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.up_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.231.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.232.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.233.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.234.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.235.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.236.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.237.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.gate_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.238.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.239.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.240.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.down_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.241.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.242.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.243.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.244.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.245.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.245.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.246.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.247.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.up_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.248.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.249.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.250.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.251.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.gate_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.252.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.253.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.254.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.10.mlp.experts.255.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.10.mlp.experts.255.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.q_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.kv_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.self_attn.o_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight": 
"model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.shared_experts.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.0.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.1.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.2.down_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.3.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.4.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.5.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.11.mlp.experts.6.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.6.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.7.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.8.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.9.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + 
"model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.10.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.11.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.12.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.11.mlp.experts.13.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.13.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.14.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.15.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.16.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + 
"model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.17.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.18.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.19.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", + 
"model.layers.11.mlp.experts.20.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.20.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.21.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.22.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", + "model.layers.11.mlp.experts.23.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.23.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.24.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.25.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.26.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.27.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.27.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.28.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.29.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.30.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.31.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.32.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.33.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.34.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.34.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.35.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.36.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.37.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.38.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.39.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.40.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.41.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.41.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.42.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.43.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.44.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.45.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.46.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.47.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.48.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.48.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.49.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.50.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.51.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.52.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.53.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.54.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.55.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.55.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.56.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.57.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.58.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.59.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.60.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.61.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.62.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.62.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.63.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.64.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.65.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.66.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.67.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.68.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.69.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.69.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.70.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.71.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.72.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.73.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.74.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.75.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.76.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.76.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.77.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.78.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.79.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.80.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.81.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.82.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.83.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.83.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.84.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.85.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.86.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.87.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.88.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.89.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.90.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.90.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.91.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.92.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.93.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.94.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.95.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.96.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.97.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.97.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.98.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.99.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.100.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.101.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.102.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.103.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.104.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.104.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.105.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.106.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.107.down_proj.weight_scale_inv": 
"model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.108.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.109.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.110.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight": 
"model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.111.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.112.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.113.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", + 
"model.layers.11.mlp.experts.114.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.115.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.116.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.117.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.gate_proj.weight_scale_inv": 
"model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.118.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.119.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.120.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", + "model.layers.11.mlp.experts.121.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.121.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.122.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.123.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.124.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.125.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.125.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.126.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.127.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.up_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.128.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.129.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.130.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.131.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.132.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.133.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.134.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.135.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.135.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.136.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.137.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.138.down_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.139.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.140.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.141.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.142.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.143.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.144.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.145.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.146.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.147.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.148.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.gate_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.149.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.150.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.151.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.152.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.153.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.154.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.155.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.156.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.156.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.157.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.158.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.up_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.159.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.160.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.161.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.162.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.gate_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.163.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.164.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.165.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.166.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.166.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.167.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.168.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.169.down_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.170.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.171.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.172.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.up_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.173.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.174.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.175.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.176.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.177.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.178.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.179.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.gate_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.180.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.181.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.182.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.down_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.183.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.184.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.185.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.186.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.187.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.187.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.188.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.189.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.up_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.190.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.191.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.192.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.193.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.gate_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.194.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.195.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.196.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.197.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.197.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.198.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.199.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.200.down_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.201.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.202.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.203.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.up_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.204.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.205.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.206.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.207.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.208.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.209.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.210.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.gate_proj.weight_scale_inv": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.211.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.212.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.213.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.down_proj.weight": 
"model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.214.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.215.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.216.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.217.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", + 
"model.layers.11.mlp.experts.218.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", + "model.layers.11.mlp.experts.218.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.219.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.220.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.up_proj.weight_scale_inv": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.221.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.222.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.223.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.224.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.gate_proj.weight": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.225.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.226.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.227.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.11.mlp.experts.228.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.228.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.229.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.230.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.231.down_proj.weight_scale_inv": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.232.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.233.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.234.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.up_proj.weight": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.235.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.236.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.237.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.11.mlp.experts.238.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.239.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.240.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.241.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.gate_proj.weight_scale_inv": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.242.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.243.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.244.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.down_proj.weight": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.245.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.246.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.247.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.248.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.11.mlp.experts.249.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.249.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.250.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.251.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.up_proj.weight_scale_inv": 
"model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.252.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.253.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.254.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.11.mlp.experts.255.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.11.input_layernorm.weight": 
"model-00026-of-000163.safetensors", + "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.q_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.kv_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.self_attn.o_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.shared_experts.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.0.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.1.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.2.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.3.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.3.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.4.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.5.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.6.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.7.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.8.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.9.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.10.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.10.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.11.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.12.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.13.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.14.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.15.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.16.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.17.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.17.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.18.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.19.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.20.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.21.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.22.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.23.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.24.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.24.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.25.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.26.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.27.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.28.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.29.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.30.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.31.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.31.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.32.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.33.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.34.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.35.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.36.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.37.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.38.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.38.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.39.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.40.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.41.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.42.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.43.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.44.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.45.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.45.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.46.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.47.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.48.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.49.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.50.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.51.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", + 
"model.layers.12.mlp.experts.52.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.52.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.53.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.54.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", + "model.layers.12.mlp.experts.55.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.55.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.56.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.57.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.58.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.59.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.59.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.60.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.61.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.62.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.63.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.64.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.65.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.66.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.66.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.67.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.68.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.69.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.70.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.71.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.72.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.73.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.73.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.74.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.75.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.76.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.77.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.78.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.79.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.80.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.80.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.81.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.82.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.83.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.84.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.85.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.86.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.87.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.87.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.88.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.89.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.90.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.91.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.92.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.93.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.94.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.94.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.95.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.96.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.97.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.98.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.99.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.100.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.101.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.101.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.102.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.103.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.104.down_proj.weight_scale_inv": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.105.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.106.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.107.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.108.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.109.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.110.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.111.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.112.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.113.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.114.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.gate_proj.weight_scale_inv": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.115.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.116.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.117.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.118.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.119.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.120.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.121.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.122.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.122.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.123.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.124.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.up_proj.weight_scale_inv": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.125.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.126.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.127.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.128.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.129.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.130.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.131.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.132.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.132.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.133.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.134.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.135.down_proj.weight_scale_inv": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.136.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.137.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.138.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.139.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.140.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.141.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", + 
"model.layers.12.mlp.experts.142.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.143.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.144.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.145.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.gate_proj.weight_scale_inv": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.146.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.147.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.148.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight": 
"model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.149.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.150.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.151.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", + "model.layers.12.mlp.experts.152.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.153.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.153.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.154.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.155.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.up_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.156.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.157.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.158.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.159.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.gate_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.160.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.161.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.162.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.163.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.163.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.164.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.165.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.166.down_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.167.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.168.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.169.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.up_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.170.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.171.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.172.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.173.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.174.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.175.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.176.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.gate_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.177.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.178.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.179.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.down_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.180.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.181.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.182.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.183.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.184.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.184.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.185.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.186.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.up_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.187.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.188.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.189.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.190.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.gate_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.191.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.192.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.193.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.194.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.194.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.195.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.196.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.197.down_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.198.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.199.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.200.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.up_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.201.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.202.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.203.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.204.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.205.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.206.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.207.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.gate_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.208.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.209.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.210.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.down_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.211.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.212.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.213.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.214.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.215.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.215.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.216.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.217.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.up_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.218.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.219.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.220.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.221.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.gate_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.222.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.223.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.224.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.225.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.225.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.226.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.227.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.228.down_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.229.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.230.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.231.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.up_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.232.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.233.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.234.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.235.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.236.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.237.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.238.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.gate_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.239.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.240.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.241.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.down_proj.weight": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.242.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.243.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.244.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.245.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", + 
"model.layers.12.mlp.experts.246.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.246.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.247.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.248.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.up_proj.weight_scale_inv": 
"model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.249.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", + "model.layers.12.mlp.experts.250.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.250.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.251.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.252.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.gate_proj.weight": 
"model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.253.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.254.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.12.mlp.experts.255.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_proj.weight_scale_inv": 
"model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.q_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.kv_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.self_attn.o_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.shared_experts.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.0.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.0.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.1.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.2.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.3.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.4.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.5.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.6.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.7.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.7.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.8.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.9.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.10.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.11.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.12.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.13.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.14.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.14.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.15.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.16.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.17.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.18.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.19.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.20.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.21.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.21.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.22.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.23.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.24.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.25.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.26.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.27.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.28.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.28.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.29.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.30.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.31.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.32.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.33.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.34.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.35.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.35.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.36.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.37.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.38.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.39.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.40.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.41.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.42.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.42.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.43.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.44.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.45.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.46.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.47.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.48.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.49.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.49.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.50.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.51.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.52.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.53.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.54.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.55.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.56.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.56.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.57.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.58.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.59.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.60.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.61.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.62.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.63.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.63.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.64.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.65.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.66.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.67.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.68.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.69.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.70.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.70.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.71.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.72.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.73.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.74.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.75.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.76.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.77.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.77.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.78.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.79.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.80.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.81.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.82.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.83.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", + 
"model.layers.13.mlp.experts.84.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.84.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.85.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", + "model.layers.13.mlp.experts.86.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.87.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.88.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.89.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.90.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.91.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.91.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.92.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.93.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.94.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.95.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.96.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.97.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.98.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.98.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.99.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.100.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.101.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.102.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.103.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.104.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.105.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.105.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.106.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.107.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.108.down_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.109.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.110.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.111.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.112.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.113.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.114.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.115.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.116.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.117.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.118.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.gate_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.119.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.120.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.121.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.122.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.123.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.124.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.125.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.126.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.126.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.127.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.128.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.up_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.129.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.130.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.131.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.132.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.133.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.134.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.135.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.136.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.136.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.137.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.138.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.139.down_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.140.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.141.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.142.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.143.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.144.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.145.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.146.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.147.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.148.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.149.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.gate_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.150.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.151.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.152.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.153.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.154.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.155.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.156.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.157.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.157.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.158.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.159.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.up_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.160.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.161.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.162.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.163.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.gate_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.164.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.165.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.166.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.167.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.167.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.168.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.169.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.170.down_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.171.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.172.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.173.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.up_proj.weight": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.174.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.175.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.176.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", + 
"model.layers.13.mlp.experts.177.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.178.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.179.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.180.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.gate_proj.weight_scale_inv": 
"model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.181.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.182.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.183.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", + "model.layers.13.mlp.experts.184.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.184.down_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.184.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.185.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.186.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.187.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.188.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.188.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.189.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.190.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.up_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.191.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.192.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.193.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.194.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.gate_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.195.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.196.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.197.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.198.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.198.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.199.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.200.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.201.down_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.202.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.203.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.204.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.up_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.205.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.206.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.207.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.208.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.209.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.210.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.211.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.gate_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.212.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.213.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.214.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.down_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.215.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.216.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.217.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.218.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.219.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.219.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.220.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.221.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.up_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.222.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.223.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.224.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.225.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.gate_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.226.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.227.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.228.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.229.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.229.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.230.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.231.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.232.down_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.233.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.234.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.235.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.up_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.236.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.237.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.238.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.239.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.240.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.241.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.242.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.gate_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.243.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.244.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.245.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.down_proj.weight": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.246.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.247.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.248.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.249.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.13.mlp.experts.250.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.250.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.251.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.252.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.up_proj.weight_scale_inv": 
"model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.253.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.254.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.13.mlp.experts.255.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.q_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + 
"model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.kv_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.self_attn.o_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.shared_experts.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.0.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.1.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.2.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.3.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.4.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.4.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.5.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.6.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.7.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.8.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.9.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.10.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.11.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.11.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.12.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.13.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.14.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.15.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.16.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.17.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", + 
"model.layers.14.mlp.experts.18.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.18.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.19.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", + "model.layers.14.mlp.experts.20.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.21.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.22.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.23.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.24.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.25.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.25.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.26.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.27.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.28.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.29.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.30.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.31.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.32.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.32.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.33.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.34.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.35.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.36.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.37.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.38.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.39.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.39.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.40.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.41.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.42.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.43.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.44.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.45.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.46.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.46.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.47.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.48.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.49.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.50.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.51.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.52.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.53.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.53.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.54.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.55.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.56.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.57.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.58.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.59.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.60.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.60.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.61.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.62.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.63.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.64.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.65.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.66.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.67.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.67.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.68.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.69.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.70.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.71.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.72.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.73.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.74.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.74.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.75.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.76.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.77.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.78.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.79.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.80.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.81.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.81.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.82.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.83.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.84.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.85.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.86.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.87.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.88.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.88.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.89.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.90.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.91.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.92.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.93.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.94.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.95.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.95.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.96.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.97.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.98.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.99.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.100.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.101.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.102.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.102.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.103.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.104.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.105.down_proj.weight_scale_inv": 
"model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.106.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.107.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.108.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight": 
"model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.109.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.110.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.111.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", + 
"model.layers.14.mlp.experts.112.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.113.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.114.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.115.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.gate_proj.weight_scale_inv": 
"model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.116.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.117.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", + "model.layers.14.mlp.experts.118.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.118.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.119.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.120.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.121.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.122.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.123.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.123.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.124.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.125.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.up_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.126.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.127.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.128.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.129.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.130.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.131.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.132.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.133.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.133.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.134.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.135.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.136.down_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.137.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.138.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.139.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.140.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.141.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.142.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.143.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.144.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.145.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.146.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.gate_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.147.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.148.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.149.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.150.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.151.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.152.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.153.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.154.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.154.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.155.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.156.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.up_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.157.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.158.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.159.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.160.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.gate_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.161.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.162.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.163.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.164.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.164.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.165.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.166.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.167.down_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.168.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.169.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.170.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.up_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.171.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.172.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.173.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.174.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.175.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.176.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.177.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.gate_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.178.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.179.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.180.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.down_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.181.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.182.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.183.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.184.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.185.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.185.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.186.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.187.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.up_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.188.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.189.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.190.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.191.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.gate_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.192.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.193.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.194.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.195.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.195.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.196.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.197.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.198.down_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.199.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.200.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.201.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.up_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.202.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.203.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.204.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.205.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.206.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.207.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.208.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.gate_proj.weight_scale_inv": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.209.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.210.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.211.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.down_proj.weight": 
"model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.212.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.213.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.214.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.215.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", + "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", + 
"model.layers.14.mlp.experts.216.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.216.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.217.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.218.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.up_proj.weight_scale_inv": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.219.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.220.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.221.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.222.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.gate_proj.weight": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.223.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.224.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.225.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", + 
"model.layers.14.mlp.experts.226.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.226.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.227.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.228.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.229.down_proj.weight_scale_inv": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.230.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.231.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.232.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.up_proj.weight": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.233.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.234.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.235.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", + 
"model.layers.14.mlp.experts.236.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.237.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.238.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.239.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.gate_proj.weight_scale_inv": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.240.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.241.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.242.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.down_proj.weight": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.243.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.244.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.245.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.246.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", + 
"model.layers.14.mlp.experts.247.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.247.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.248.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.249.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.up_proj.weight_scale_inv": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.250.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.251.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.252.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.253.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.gate_proj.weight": 
"model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.254.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", + "model.layers.14.mlp.experts.255.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", + "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", + "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_a_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.q_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.kv_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.self_attn.o_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.shared_experts.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.0.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.1.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.1.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.2.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.3.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.4.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.5.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.6.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.7.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.8.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.8.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.9.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.10.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.11.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.12.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.13.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.14.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.15.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.15.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.16.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.17.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.18.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.19.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.20.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.21.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.22.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.22.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.23.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.24.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.25.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.26.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.27.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.28.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.29.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.29.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.30.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.31.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.32.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.33.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.34.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.35.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.36.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.36.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.37.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.38.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.39.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.40.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.41.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.42.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.43.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.43.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.44.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.45.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.46.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.47.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.48.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.49.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.50.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.50.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.51.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.52.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.53.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.54.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.55.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.56.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.57.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.57.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.58.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.59.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.60.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.61.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.62.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.63.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.64.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.64.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.65.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.66.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.67.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.68.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.69.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.70.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.71.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.71.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.72.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.73.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.74.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.75.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.76.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.77.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.78.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.78.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.79.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.80.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.81.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.82.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.83.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.84.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.85.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.85.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.86.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.87.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.88.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + 
"model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.89.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.90.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.91.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", + "model.layers.15.mlp.experts.92.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.92.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.92.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.93.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.94.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.95.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.96.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.97.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.98.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.99.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.99.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.100.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.101.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.102.down_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.103.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.104.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.105.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.106.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.107.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.108.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.109.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.110.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.111.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.112.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.gate_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.113.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.114.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.115.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.116.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.117.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.118.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.119.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.120.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.120.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.121.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.122.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.up_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.123.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.124.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.125.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.126.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.127.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.128.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.129.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.130.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.130.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.131.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.132.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.133.down_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.134.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.135.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.136.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.137.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.138.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.139.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.140.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.141.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.142.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.143.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.gate_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.144.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.145.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.146.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.147.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.148.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.149.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.150.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.151.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.151.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.152.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.153.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.up_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.154.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.155.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.156.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.157.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.158.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.159.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.160.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.161.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.161.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.162.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.163.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.164.down_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.165.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.166.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.167.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.up_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.168.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.169.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.170.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.171.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.172.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.173.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.174.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.gate_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.175.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.176.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.177.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.down_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.178.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.179.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.180.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.181.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", + 
"model.layers.15.mlp.experts.182.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.182.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.183.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.184.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.up_proj.weight_scale_inv": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.185.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.186.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.187.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.188.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.gate_proj.weight": 
"model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", + "model.layers.15.mlp.experts.189.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.190.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.191.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.192.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.192.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.193.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.194.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.195.down_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.196.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.197.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.198.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.up_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.199.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.200.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.201.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.202.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.203.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.204.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.205.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.gate_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.206.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.207.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.208.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.down_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.209.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.210.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.211.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.212.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.213.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.213.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.214.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.215.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.up_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.216.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.217.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.218.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.219.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.gate_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.220.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.221.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.222.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.223.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.223.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.224.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.225.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.226.down_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.227.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.228.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.229.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.up_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.230.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.231.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.232.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.233.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.234.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.235.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.236.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.gate_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.237.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.238.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.239.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.down_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.240.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.241.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.242.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.243.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.244.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.244.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.245.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.246.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.up_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.247.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.248.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.249.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.250.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.gate_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.251.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.252.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.253.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.15.mlp.experts.254.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.254.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.15.mlp.experts.255.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.q_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.kv_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.self_attn.o_proj.weight": 
"model-00037-of-000163.safetensors", + "model.layers.16.self_attn.o_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.shared_experts.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.0.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.2.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.3.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.4.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.5.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.5.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.6.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.7.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.8.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.9.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.10.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.11.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.12.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.12.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.13.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.14.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.15.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.16.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.17.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.18.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.19.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.19.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.20.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.21.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.22.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + 
"model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.23.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.24.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.25.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", + "model.layers.16.mlp.experts.26.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.26.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.26.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.27.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.28.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.29.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.30.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.31.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.32.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.33.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.33.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.34.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.35.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.36.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.37.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.38.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.39.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.40.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.40.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.41.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.42.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.43.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.44.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.45.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.46.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.47.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.47.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.48.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.49.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.50.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.51.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.52.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.53.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.54.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.54.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.55.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.56.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.57.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.58.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.59.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.60.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.61.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.61.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.62.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.63.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.64.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.65.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.66.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.67.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.68.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.68.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.69.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.70.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.71.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.72.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.73.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.74.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.75.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.75.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.76.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.77.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.78.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.79.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.80.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.81.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.82.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.82.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.83.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.84.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.85.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.86.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.87.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.88.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.89.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.89.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.90.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.91.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.92.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.93.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.94.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.95.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.96.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.96.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.97.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.98.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.99.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.100.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.101.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.102.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.103.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.103.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.104.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.105.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.107.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.108.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.109.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight": 
"model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.110.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.111.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.112.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", + 
"model.layers.16.mlp.experts.113.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.114.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.115.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.116.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.117.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.118.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.119.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight": 
"model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.120.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.121.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.122.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", + "model.layers.16.mlp.experts.123.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.124.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.124.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.125.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.126.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.127.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.128.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.129.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.130.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.131.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.132.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.133.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.134.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.134.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.135.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.136.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.138.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.139.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.140.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.141.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.142.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.143.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.144.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.145.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.146.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.147.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.148.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.149.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.150.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.151.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.152.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.153.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.154.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.155.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.155.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.156.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.157.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.158.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.159.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.160.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.161.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.gate_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.162.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.163.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.164.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.165.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.165.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.166.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.167.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.169.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.170.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.171.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.up_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.172.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.173.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.174.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.175.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.176.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.177.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.178.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.179.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.180.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.181.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.down_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.182.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.183.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.184.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.185.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.186.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.186.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.187.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.188.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.189.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.190.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.191.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.192.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.gate_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.193.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.194.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.195.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.196.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.196.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.197.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.198.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.200.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.201.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.202.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.up_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.203.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.204.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.205.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.206.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.207.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.208.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.209.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.210.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.211.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.212.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.down_proj.weight": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.213.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.214.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.215.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.216.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", + 
"model.layers.16.mlp.experts.217.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.217.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.218.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.219.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.220.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", + "model.layers.16.mlp.experts.221.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.221.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.222.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.223.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.gate_proj.weight": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.224.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.225.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.226.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.16.mlp.experts.227.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.227.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.228.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.229.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.231.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.232.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.233.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.up_proj.weight": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.234.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.235.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.236.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.16.mlp.experts.237.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.238.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.239.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.240.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.241.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.242.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.243.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.down_proj.weight": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.244.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.245.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.246.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.247.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.16.mlp.experts.248.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.248.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.249.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.250.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.251.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.252.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.253.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.254.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.gate_proj.weight": 
"model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.16.mlp.experts.255.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.q_b_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.kv_b_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.self_attn.o_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight": 
"model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.shared_experts.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.0.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.1.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.2.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.3.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.4.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.5.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.6.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.6.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.7.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.8.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.9.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.10.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.11.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.12.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.13.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.13.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.14.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.15.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.16.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.17.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.18.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.19.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.20.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.20.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.21.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.22.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.23.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.24.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.25.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.26.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.27.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.27.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.28.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.29.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.30.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.31.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.32.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.33.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.34.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.34.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.35.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.36.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.37.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.38.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.39.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.40.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.41.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.41.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.42.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.43.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.44.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.45.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.46.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.47.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.48.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.48.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.49.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.50.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.51.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.52.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.53.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.54.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", + 
"model.layers.17.mlp.experts.55.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.55.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.56.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", + "model.layers.17.mlp.experts.57.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.58.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.59.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.60.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.61.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.62.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.62.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.63.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.64.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.65.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.66.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.67.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.68.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.69.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.69.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.70.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.71.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.72.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.73.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.74.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.75.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.76.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.76.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.77.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.78.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.79.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.80.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.81.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.82.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.83.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.83.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.84.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.85.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.86.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.87.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.88.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.89.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.90.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.90.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.91.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.92.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.93.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.94.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.95.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.96.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.97.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.97.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.98.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.99.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.100.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.101.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.102.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.103.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.104.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.104.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.105.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.106.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.107.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.108.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.109.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.110.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.111.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.112.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.113.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.114.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.114.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.115.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.116.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.118.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.119.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.120.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.121.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.122.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.123.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.124.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.125.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.126.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.127.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.128.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.129.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.130.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.131.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.132.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.133.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.134.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.135.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.135.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.136.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.137.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.138.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.139.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.140.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.141.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.142.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.143.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.144.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", + 
"model.layers.17.mlp.experts.145.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.145.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.146.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.147.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.149.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.150.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.151.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight": 
"model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.152.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.153.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.154.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", + "model.layers.17.mlp.experts.155.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.gate_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.up_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.170.down_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.gate_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.up_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.192.down_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.gate_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.up_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.214.down_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.gate_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.up_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.236.down_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.gate_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.up_proj.weight": 
"model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", + "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_a_layernorm.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.5.down_proj.weight": 
"model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", + 
"model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", + "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", + 
"model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", + "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.gate_proj.weight": 
"model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.4.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", + 
"model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", + "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", + 
"model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", + "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", + 
"model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", + "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.q_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.weight": 
"model-00048-of-000163.safetensors", + "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", + 
"model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", + "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", + 
"model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", + "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", + 
"model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", + "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.gate_proj.weight": 
"model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", + 
"model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", + "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", + 
"model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", + "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.weight": 
"model-00053-of-000163.safetensors", + "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.3.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", + 
"model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", + "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", + 
"model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", + "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", + 
"model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", + "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", + 
"model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", + "model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", + "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.gate_proj.weight": 
"model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.10.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", + 
"model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", + "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", + 
"model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", + "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.weight": 
"model-00059-of-000163.safetensors", + "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", + 
"model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", + "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", + 
"model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", + "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", + 
"model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", + "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.gate_proj.weight": 
"model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.6.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", + 
"model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", + "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", + 
"model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", + "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", + 
"model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", + "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.weight": 
"model-00065-of-000163.safetensors", + "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", + 
"model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", + "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", + 
"model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", + "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.gate_proj.weight": 
"model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", + 
"model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", + "model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", + 
"model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", + "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", + 
"model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", + "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.weight": 
"model-00070-of-000163.safetensors", + "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.5.down_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", + 
"model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", + "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", + 
"model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", + "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", + 
"model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", + "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.gate_proj.weight": 
"model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", + 
"model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", + "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", + 
"model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", + "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_a_layernorm.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.weight": 
"model-00075-of-000163.safetensors", + "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", + 
"model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", + "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", + 
"model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", + "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", + 
"model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", + "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", + 
"model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", + "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", + "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.gate_proj.weight": 
"model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.4.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", + 
"model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", + "model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", + 
"model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", + "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.q_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.weight": 
"model-00081-of-000163.safetensors", + "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", + 
"model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", + "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", + 
"model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.124.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.125.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.126.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.127.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.127.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.128.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.129.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.up_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.130.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.131.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.132.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.133.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.134.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.135.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.136.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.137.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.137.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.138.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.139.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.140.down_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.141.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.142.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.143.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.144.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.145.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.146.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.147.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.148.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.149.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.150.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.gate_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.151.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.152.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.153.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.154.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.155.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.156.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.157.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.158.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.158.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.159.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.160.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.up_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.161.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.162.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.163.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.164.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.gate_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.165.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.166.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.167.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.168.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.168.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.169.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.170.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.171.down_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.172.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.173.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.174.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.up_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.175.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.176.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.177.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.178.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.179.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.180.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.181.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.gate_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.182.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.183.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.184.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.down_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.185.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.186.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.187.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.188.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.189.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.189.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.190.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.191.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.up_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.192.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.193.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.194.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.195.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.gate_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.196.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.197.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.198.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.199.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.199.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.200.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.201.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.202.down_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.203.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.204.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.205.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.up_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.206.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.207.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.208.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.209.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.210.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.211.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.212.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.gate_proj.weight_scale_inv": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.213.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.214.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.215.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.down_proj.weight": 
"model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.216.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.217.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.218.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.219.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", + 
"model.layers.32.mlp.experts.220.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.220.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", + "model.layers.32.mlp.experts.221.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.221.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.222.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.up_proj.weight_scale_inv": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.223.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.224.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.225.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.226.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.gate_proj.weight": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.227.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.228.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.229.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.32.mlp.experts.230.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.230.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.231.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.232.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.233.down_proj.weight_scale_inv": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.234.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.235.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.236.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.up_proj.weight": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.237.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.238.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.239.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.32.mlp.experts.240.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.241.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.242.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.243.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.gate_proj.weight_scale_inv": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.244.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.245.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.246.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.down_proj.weight": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.247.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.248.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.249.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.250.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.32.mlp.experts.251.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.251.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.252.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.253.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.up_proj.weight_scale_inv": 
"model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.254.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.32.mlp.experts.255.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.q_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.kv_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.self_attn.o_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.shared_experts.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.0.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.1.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.2.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.3.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.4.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.5.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.5.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.6.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.7.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.8.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.9.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.10.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.11.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.12.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.12.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.13.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.14.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.15.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.16.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.17.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.18.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.19.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.19.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.20.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.21.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.22.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.23.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.24.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.25.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.26.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.26.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.27.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.28.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.29.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.30.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.31.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.32.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.33.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.33.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.34.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.35.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.36.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.37.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.38.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.39.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.40.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.40.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.41.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.42.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.43.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.44.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.45.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.46.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.47.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.47.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.48.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.49.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.50.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.51.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.52.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.53.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", + 
"model.layers.33.mlp.experts.54.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.54.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.55.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.56.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", + "model.layers.33.mlp.experts.57.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.58.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.59.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.60.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.61.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.61.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.62.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.63.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.64.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.65.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.66.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.67.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.68.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.68.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.69.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.70.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.71.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.72.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.73.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.74.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.75.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.75.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.76.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.77.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.78.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.79.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.80.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.81.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.82.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.82.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.83.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.84.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.85.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.86.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.87.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.88.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.89.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.89.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.90.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.91.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.92.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.93.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.94.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.95.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.96.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.96.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.97.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.98.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.99.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.100.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.101.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.102.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.103.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.103.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.104.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.105.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.107.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.108.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.109.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.110.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.111.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.112.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.113.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.114.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.115.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.116.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.117.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.118.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.119.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.120.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.121.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.122.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.123.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.124.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.124.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.125.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.126.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.127.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.128.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.129.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.130.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.131.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.132.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.133.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.134.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.134.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.135.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.136.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.138.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.139.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.140.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.141.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.142.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.143.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.144.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.145.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.146.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.147.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.148.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.149.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.150.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight": 
"model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.151.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.152.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.153.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.154.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", + 
"model.layers.33.mlp.experts.155.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", + "model.layers.33.mlp.experts.155.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.155.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.156.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.157.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.158.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.159.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.160.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.161.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.gate_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.162.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.163.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.164.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.165.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.165.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.166.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.167.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.169.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.170.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.171.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.up_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.172.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.173.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.174.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.175.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.176.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.177.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.178.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.179.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.180.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.181.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.down_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.182.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.183.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.184.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.185.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.186.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.186.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.187.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.188.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.189.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.190.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.191.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.192.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.gate_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.193.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.194.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.195.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.196.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.196.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.197.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.198.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.200.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.201.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.202.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.up_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.203.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.204.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.205.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.206.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.207.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.208.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.209.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.210.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.211.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.212.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.down_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.213.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.214.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.215.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.216.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.217.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.217.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.218.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.219.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.220.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.221.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.222.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.223.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.gate_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.224.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.225.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.226.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.227.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.227.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.228.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.229.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.231.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.232.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.233.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.up_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.234.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.235.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.236.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.237.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.238.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.239.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.240.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.241.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.242.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.243.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.down_proj.weight": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.244.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.245.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.246.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.247.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", + 
"model.layers.33.mlp.experts.248.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.248.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.249.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.250.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.251.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.252.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", + "model.layers.33.mlp.experts.253.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.253.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.254.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.gate_proj.weight": 
"model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.33.mlp.experts.255.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.q_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.kv_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.self_attn.o_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight": 
"model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.shared_experts.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.0.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.1.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.2.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.3.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.4.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.5.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.6.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.6.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.7.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.8.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.9.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.10.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.11.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.12.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.13.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.13.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.14.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.15.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.16.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.17.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.18.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.19.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.20.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.20.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.21.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.22.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.23.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.24.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.25.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.26.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.27.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.27.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.28.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.29.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.30.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.31.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.32.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.33.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.34.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.34.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.35.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.36.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.37.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.38.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.39.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.40.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.41.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.41.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.42.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.43.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.44.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.45.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.46.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.47.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.48.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.48.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.49.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.50.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.51.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.52.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.53.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.54.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.55.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.55.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.56.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.57.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.58.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.59.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.60.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.61.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.62.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.62.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.63.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.64.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.65.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.66.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.67.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.68.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.69.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.69.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.70.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.71.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.72.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.73.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.74.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.75.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.76.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.76.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.77.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.78.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.79.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.80.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.81.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.82.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.83.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.83.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.84.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.85.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + 
"model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.86.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.87.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.88.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", + "model.layers.34.mlp.experts.89.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.89.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.90.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.90.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.91.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.92.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.93.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.94.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.95.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.96.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.97.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.97.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.98.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.99.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.100.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.101.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.102.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.103.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.104.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.104.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.105.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.106.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.107.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.108.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.109.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.110.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.111.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.112.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.113.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.114.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.114.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.115.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.116.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.118.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.119.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.120.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.121.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.122.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.123.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.124.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.125.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.126.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.127.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.128.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.129.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.130.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.131.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.132.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.133.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.134.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.135.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.135.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.136.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.137.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.138.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.139.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.140.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.141.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.142.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.143.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.144.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.145.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.145.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.146.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.147.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.149.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.150.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.151.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.152.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.153.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.154.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.155.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.156.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.157.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.158.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.gate_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.159.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.160.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.161.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.down_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.162.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.163.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.164.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.165.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.166.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.166.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.167.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.168.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.up_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.169.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.170.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.171.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.172.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.gate_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.173.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.174.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.175.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.176.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.176.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.177.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.178.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.179.down_proj.weight_scale_inv": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.180.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.181.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.182.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.up_proj.weight": 
"model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.183.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.184.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.185.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", + 
"model.layers.34.mlp.experts.186.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", + "model.layers.34.mlp.experts.187.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.187.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.188.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.189.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.gate_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.190.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.191.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.192.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.down_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.193.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.194.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.195.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.196.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.197.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.197.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.198.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.199.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.up_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.200.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.201.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.202.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.203.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.gate_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.204.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.205.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.206.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.207.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.207.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.208.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.209.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.210.down_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.211.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.212.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.213.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.up_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.214.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.215.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.216.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.217.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.218.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.219.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.220.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.gate_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.221.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.222.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.223.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.down_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.224.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.225.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.226.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.227.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.228.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.228.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.229.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.230.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.up_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.231.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.232.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.233.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.234.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.gate_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.235.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.236.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.237.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.238.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.238.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.239.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.240.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.241.down_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.242.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.243.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.244.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.up_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.245.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.246.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.247.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.34.mlp.experts.248.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.249.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.250.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.251.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.gate_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.252.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.253.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.254.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.down_proj.weight": 
"model-00089-of-000163.safetensors", + "model.layers.34.mlp.experts.255.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.q_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.kv_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.self_attn.o_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.shared_experts.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.0.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.1.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.2.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.3.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.3.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.4.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.5.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.6.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.7.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.8.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.9.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.10.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.10.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.11.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.12.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.13.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.14.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.15.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.16.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.17.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.17.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.18.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.19.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + 
"model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.20.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.21.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.22.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", + "model.layers.35.mlp.experts.23.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.23.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.24.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.24.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.25.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.26.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.27.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.28.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.29.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.30.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.31.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.31.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.32.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.33.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.34.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.35.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.36.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.37.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.38.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.38.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.39.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.40.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.41.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.42.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.43.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.44.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.45.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.45.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.46.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.47.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.48.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.49.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.50.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.51.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.52.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.52.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.53.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.54.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.55.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.56.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.57.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.58.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.59.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.59.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.60.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.61.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.62.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.63.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.64.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.65.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.66.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.66.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.67.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.68.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.69.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.70.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.71.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.72.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.73.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.73.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.74.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.75.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.76.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.77.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.78.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.79.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.80.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.80.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.81.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.82.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.83.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.84.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.85.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.86.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.87.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.87.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.88.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.89.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.90.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.91.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.92.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.93.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.94.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.94.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.95.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.96.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.97.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.98.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.99.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.100.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.101.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.101.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.102.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.103.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.up_proj.weight_scale_inv": 
"model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.104.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.105.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.106.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.107.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight": 
"model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.108.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.109.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.110.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", + 
"model.layers.35.mlp.experts.111.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.111.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.112.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.113.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.114.down_proj.weight_scale_inv": 
"model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.115.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.116.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.117.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight": 
"model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.118.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.119.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.120.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", + "model.layers.35.mlp.experts.121.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.121.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.122.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.123.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.124.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.gate_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.125.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.126.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.127.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.128.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.129.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.130.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.131.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.132.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.132.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.133.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.134.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.up_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.135.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.136.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.137.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.138.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.139.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.140.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.141.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.142.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.142.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.143.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.144.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.145.down_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.146.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.147.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.148.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.149.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.150.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.151.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.152.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.153.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.154.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.155.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.gate_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.156.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.157.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.158.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.159.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.160.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.161.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.162.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.163.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.163.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.164.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.165.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.up_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.166.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.167.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.168.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.169.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.gate_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.170.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.171.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.172.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.173.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.173.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.174.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.175.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.176.down_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.177.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.178.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.179.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.up_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.180.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.181.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.182.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.183.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.184.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.185.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.186.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.gate_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.187.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.188.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.189.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.down_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.190.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.191.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.192.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.193.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.194.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.194.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.195.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.196.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.up_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.197.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.198.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.199.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.200.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.gate_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.201.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.202.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.203.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.204.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.204.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.205.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.206.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.207.down_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.208.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.209.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.210.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.up_proj.weight": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.211.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.212.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.213.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", + 
"model.layers.35.mlp.experts.214.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.215.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.216.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.217.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.gate_proj.weight_scale_inv": 
"model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", + "model.layers.35.mlp.experts.218.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.219.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.220.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.down_proj.weight": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.221.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.222.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.223.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.224.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.35.mlp.experts.225.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.225.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.226.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.227.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.up_proj.weight_scale_inv": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.228.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.229.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.230.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.231.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.gate_proj.weight": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.232.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.233.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.234.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.35.mlp.experts.235.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.235.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.236.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.237.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.238.down_proj.weight_scale_inv": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.239.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.240.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.241.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.up_proj.weight": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.242.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.243.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.244.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.35.mlp.experts.245.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.246.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.247.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.248.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.gate_proj.weight_scale_inv": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.249.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.250.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.251.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.down_proj.weight": 
"model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.252.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.253.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.254.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.35.mlp.experts.255.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.35.post_attention_layernorm.weight": 
"model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.q_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.kv_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.self_attn.o_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.shared_experts.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.0.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.0.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.1.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.2.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.3.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.4.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.5.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.6.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.7.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.7.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.8.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.9.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.10.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.11.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.12.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.13.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.14.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.14.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.15.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.16.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.17.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.18.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.19.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.20.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.21.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.21.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.22.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.23.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.24.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.25.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.26.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.27.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.28.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.28.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.29.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.30.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.31.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.32.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.33.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.34.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.35.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.35.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.36.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.37.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.38.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.39.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.40.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.41.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.42.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.42.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.43.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.44.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.45.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.46.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.47.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.48.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.49.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.49.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.50.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.51.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + 
"model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.52.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.53.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.54.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", + "model.layers.36.mlp.experts.55.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.55.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.56.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.56.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.57.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.58.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.59.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.60.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.61.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.62.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.63.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.63.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.64.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.65.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.66.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.67.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.68.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.69.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.70.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.70.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.71.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.72.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.73.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.74.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.75.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.76.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.77.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.77.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.78.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.79.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.80.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.81.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.82.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.83.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.84.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.84.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.85.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.86.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.87.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.88.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.89.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.90.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.91.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.91.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.92.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.93.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.94.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.95.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.96.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.97.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.98.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.98.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.99.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.100.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.101.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.102.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.103.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.104.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.105.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.105.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.106.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.107.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.up_proj.weight_scale_inv": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.108.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.109.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.110.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.111.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.112.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.113.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.114.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.115.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.115.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.116.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.117.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.118.down_proj.weight_scale_inv": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.119.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.120.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.121.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.122.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.123.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.124.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.125.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.126.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.127.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.128.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.gate_proj.weight_scale_inv": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.129.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.130.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.131.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.132.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.133.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.134.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.135.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.136.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.136.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.137.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.138.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.up_proj.weight_scale_inv": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.139.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.140.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.141.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.142.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.143.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.144.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.145.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", + 
"model.layers.36.mlp.experts.146.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.146.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.147.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.148.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.149.down_proj.weight_scale_inv": 
"model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.150.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.151.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", + "model.layers.36.mlp.experts.152.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.153.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.154.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.155.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.156.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.157.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.158.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.159.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.gate_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.160.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.161.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.162.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.down_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.163.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.164.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.165.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.166.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.167.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.167.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.168.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.169.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.up_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.170.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.171.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.172.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.173.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.gate_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.174.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.175.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.176.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.177.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.177.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.178.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.179.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.180.down_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.181.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.182.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.183.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.up_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.184.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.185.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.186.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.187.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.188.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.189.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.190.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.gate_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.191.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.192.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.193.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.down_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.194.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.195.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.196.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.197.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.198.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.198.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.199.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.200.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.up_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.201.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.202.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.203.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.204.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.gate_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.205.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.206.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.207.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.208.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.208.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.209.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.210.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.211.down_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.212.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.213.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.214.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.up_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.215.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.216.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.217.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.218.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.219.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.220.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.221.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.gate_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.222.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.223.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.224.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.down_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.225.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.226.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.227.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.228.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.229.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.229.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.230.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.231.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.up_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.232.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.233.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.234.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.235.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.gate_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.236.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.237.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.238.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.239.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.239.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.240.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.241.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.242.down_proj.weight_scale_inv": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.243.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.244.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.245.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.up_proj.weight": 
"model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.246.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.247.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.248.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", + 
"model.layers.36.mlp.experts.249.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", + "model.layers.36.mlp.experts.250.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.250.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.251.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.252.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.gate_proj.weight_scale_inv": 
"model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.253.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.254.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.36.mlp.experts.255.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", 
+ "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.q_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.kv_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.self_attn.o_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.shared_experts.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight": 
"model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.0.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.1.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.2.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.3.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.gate_proj.weight_scale_inv": 
"model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.4.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.5.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.6.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.7.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.8.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.9.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.10.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.11.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.12.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.13.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.14.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.15.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.16.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.17.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.18.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.19.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.20.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.21.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.22.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.23.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.24.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.25.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.26.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.27.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.28.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.29.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.30.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.31.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.32.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.33.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.34.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.35.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.36.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.37.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.38.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.39.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.40.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.41.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.42.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.43.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.44.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.45.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.46.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.47.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.48.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.49.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.50.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.51.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.52.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.53.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.54.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.55.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.56.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.57.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.58.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.59.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.60.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.61.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.62.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.63.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.64.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.65.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.66.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.67.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.68.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.69.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.70.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.71.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.72.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.73.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.74.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.75.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.76.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.77.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.78.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.79.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.80.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.81.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.82.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.83.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", + 
"model.layers.37.mlp.experts.84.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.85.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", + "model.layers.37.mlp.experts.86.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.87.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.88.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.89.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.90.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.91.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.92.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.93.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.94.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.95.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.96.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.97.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.98.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.99.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.100.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.101.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
+ "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.102.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.103.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.104.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.105.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.106.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.107.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.108.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.gate_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.109.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.110.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.111.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.112.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.113.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.114.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.115.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.116.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.116.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.117.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.118.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.up_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.119.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.120.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.121.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.122.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.123.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.124.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.125.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.126.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.126.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.127.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.128.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.129.down_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.130.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.131.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.132.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.133.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.134.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.135.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.136.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.137.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.138.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.139.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.gate_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.140.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.141.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.142.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.143.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.144.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.145.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.146.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.147.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.147.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.148.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.149.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.up_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.150.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.151.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.152.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.153.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.154.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.155.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.156.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.157.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.157.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.158.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.159.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.160.down_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.161.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.162.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.163.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.up_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.164.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.165.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.166.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.167.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.168.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.169.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.170.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.gate_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.171.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.172.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.173.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.down_proj.weight": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.174.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.175.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.176.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.177.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", + 
"model.layers.37.mlp.experts.178.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.178.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.179.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.180.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.up_proj.weight_scale_inv": 
"model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.181.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.182.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.183.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", + "model.layers.37.mlp.experts.184.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.184.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.gate_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.185.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.186.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.187.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.188.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.188.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.189.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.190.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.191.down_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.192.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.193.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.194.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.up_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.195.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.196.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.197.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.198.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.199.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.200.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.201.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.gate_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.202.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.203.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.204.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.down_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.205.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.206.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.207.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.208.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.209.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.209.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.210.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.211.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.up_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.212.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.213.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.214.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.215.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.gate_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.216.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.217.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.218.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.219.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.219.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.220.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.221.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.222.down_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.223.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.224.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.225.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.up_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.226.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.227.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.228.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.229.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.230.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.231.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.232.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.gate_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.233.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.234.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.235.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.down_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.236.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.237.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.238.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.239.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.240.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.240.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.241.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.242.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.up_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.243.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.244.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.245.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.246.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.gate_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.247.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.248.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.249.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.37.mlp.experts.250.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.250.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.251.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.252.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.253.down_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.254.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.37.mlp.experts.255.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.q_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00097-of-000163.safetensors", + 
"model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.kv_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.self_attn.o_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.shared_experts.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.0.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight": 
"model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.1.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.2.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.3.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.4.down_proj.weight_scale_inv": 
"model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.5.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.6.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.7.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.38.mlp.experts.8.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.8.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.9.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.10.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.11.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + 
"model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.12.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.13.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.14.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", + 
"model.layers.38.mlp.experts.15.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.15.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.16.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.17.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.18.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + 
"model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.19.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", + "model.layers.38.mlp.experts.20.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.21.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.22.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.22.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.23.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.24.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.25.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.26.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.27.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.28.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.29.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.29.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.30.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.31.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.32.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.33.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.34.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.35.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.36.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.36.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.37.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.38.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.39.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.40.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.41.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.42.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.43.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.43.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.44.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.45.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.46.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.47.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.48.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.49.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.50.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.50.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.51.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.52.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.53.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.54.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.55.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.56.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.57.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.57.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.58.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.59.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.60.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.61.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.62.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.63.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.64.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.64.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.65.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.66.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.67.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.68.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.69.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.70.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.71.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.71.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.72.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.73.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.74.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.75.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.76.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.77.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.78.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.78.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.79.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.80.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.81.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.82.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.83.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.84.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.85.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.85.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.86.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.87.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.88.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.89.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.90.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.91.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.92.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.92.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.93.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.94.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.95.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.96.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.97.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.98.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.99.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.99.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.100.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.101.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.102.down_proj.weight_scale_inv": 
"model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.103.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.104.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.105.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight": 
"model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.106.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.107.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.108.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", + 
"model.layers.38.mlp.experts.109.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.110.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.111.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.112.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.gate_proj.weight_scale_inv": 
"model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.113.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.114.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.115.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight": 
"model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.116.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.117.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", + "model.layers.38.mlp.experts.118.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.118.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.119.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.120.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.120.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.121.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.122.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.up_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.123.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.124.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.125.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.126.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.127.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.128.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.129.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.130.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.130.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.131.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.132.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.133.down_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.134.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.135.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.136.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.137.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.138.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.139.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.140.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.141.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.142.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.143.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.gate_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.144.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.145.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.146.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.147.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.148.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.149.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.150.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.151.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.151.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.152.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.153.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.up_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.154.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.155.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.156.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.157.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.158.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.159.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.160.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.161.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.161.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.162.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.163.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.164.down_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.165.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.166.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.167.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.up_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.168.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.169.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.170.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.171.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.172.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.173.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.174.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.gate_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.175.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.176.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.177.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.down_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.178.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.179.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.180.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.181.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.182.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.182.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.183.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.184.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.up_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.185.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.186.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.187.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.188.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.gate_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.189.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.190.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.191.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.192.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.192.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.193.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.194.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.195.down_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.196.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.197.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.198.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.up_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.199.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.200.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.201.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.202.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.203.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.204.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.205.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.gate_proj.weight_scale_inv": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.206.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.207.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.208.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.down_proj.weight": 
"model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.209.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.210.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.211.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.212.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", + 
"model.layers.38.mlp.experts.213.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.213.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.214.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.215.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", + "model.layers.38.mlp.experts.216.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.up_proj.weight_scale_inv": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.216.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.217.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.218.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.219.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.gate_proj.weight": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.220.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.221.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.222.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", + 
"model.layers.38.mlp.experts.223.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.223.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.224.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.225.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.226.down_proj.weight_scale_inv": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.227.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.228.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.229.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.up_proj.weight": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.230.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.231.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.232.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", + 
"model.layers.38.mlp.experts.233.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.234.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.235.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.236.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.gate_proj.weight_scale_inv": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.237.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.238.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.239.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.down_proj.weight": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.240.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.241.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.242.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.243.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", + 
"model.layers.38.mlp.experts.244.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.244.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.245.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.246.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.up_proj.weight_scale_inv": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.247.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.248.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.249.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.250.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.gate_proj.weight": 
"model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.251.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.252.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.253.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", + 
"model.layers.38.mlp.experts.254.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.254.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", + "model.layers.38.mlp.experts.255.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", + "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", + "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_a_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.q_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.kv_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.self_attn.o_proj.weight": 
"model-00101-of-000163.safetensors", + "model.layers.39.self_attn.o_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.shared_experts.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.0.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.2.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.3.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.4.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.5.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.5.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.6.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.7.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.8.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.9.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.10.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.11.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.12.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.12.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.13.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.14.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.15.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.16.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.17.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.18.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.19.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.19.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.20.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.21.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.22.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.23.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.24.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.25.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.26.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.26.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.27.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.28.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.29.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.30.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.31.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.32.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.33.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.33.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.34.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.35.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.36.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.37.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.38.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.39.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.40.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.40.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.41.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.42.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.43.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.44.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.45.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.46.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.47.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.47.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.48.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.49.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.50.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.51.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.52.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.53.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.54.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.54.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.55.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.56.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.57.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.58.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.59.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.60.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.61.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.61.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.62.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.63.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.64.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.65.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.66.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.67.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.68.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.68.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.69.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.70.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.71.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.72.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.73.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.74.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.75.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.75.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.76.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.77.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.78.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.79.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.80.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.81.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.82.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.82.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.83.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.84.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.85.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.86.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.87.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.88.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", + 
"model.layers.39.mlp.experts.89.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.89.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.90.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.91.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", + "model.layers.39.mlp.experts.92.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.92.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.93.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.94.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.95.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.96.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.96.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.97.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.98.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.99.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.100.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.101.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.102.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.103.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.103.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.104.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.105.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.107.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.108.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.109.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.110.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.111.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.112.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.113.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.114.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.115.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.116.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.117.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.118.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.119.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.120.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.121.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.122.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.123.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.124.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.124.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.125.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.126.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.127.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.128.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.129.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.130.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.131.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.132.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.133.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.134.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.134.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.135.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.136.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.138.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.139.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.140.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.141.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.142.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.143.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.144.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.145.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.146.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.147.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.148.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.149.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.150.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.151.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.152.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.153.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.154.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.155.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.155.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.156.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.157.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.158.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.159.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.160.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.161.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.gate_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.162.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.163.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.164.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.165.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.165.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.166.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.167.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.169.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.170.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.171.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.up_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.172.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.173.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.174.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.175.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.176.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.177.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.178.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.179.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.180.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.181.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.down_proj.weight": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.182.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.183.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.184.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.185.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", + 
"model.layers.39.mlp.experts.186.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.186.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.187.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.188.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", + "model.layers.39.mlp.experts.189.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.190.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.191.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.192.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.gate_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.193.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.194.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.195.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.196.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.196.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.197.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.198.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.200.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.201.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.202.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.up_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.203.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.204.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.205.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.206.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.207.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.208.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.209.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.210.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.211.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.212.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.down_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.213.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.214.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.215.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.216.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.217.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.217.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.218.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.219.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.220.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.221.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.222.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.223.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.gate_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.224.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.225.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.226.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.227.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.227.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.228.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.229.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.231.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.232.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.233.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.up_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.234.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.235.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.236.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.237.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.238.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.239.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.240.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.241.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.242.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.243.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.down_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.244.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.245.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.246.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.247.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.39.mlp.experts.248.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.248.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.249.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.250.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.251.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.252.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.253.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.254.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.gate_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.39.mlp.experts.255.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.q_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.kv_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.self_attn.o_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight": 
"model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.shared_experts.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.0.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.1.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.2.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.3.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.4.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.5.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.6.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.6.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.7.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.8.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.9.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.10.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.11.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.12.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.13.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.13.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.14.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.15.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.16.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.17.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.18.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.19.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.20.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.20.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.21.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.22.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + 
"model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.23.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.24.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.25.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", + "model.layers.40.mlp.experts.26.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.26.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.27.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.27.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.28.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.29.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.30.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.31.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.32.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.33.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.34.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.34.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.35.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.36.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.37.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.38.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.39.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.40.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.41.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.41.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.42.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.43.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.44.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.45.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.46.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.47.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.48.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.48.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.49.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.50.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.51.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.52.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.53.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.54.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.55.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.55.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.56.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.57.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.58.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.59.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.60.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.61.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.62.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.62.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.63.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.64.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.65.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.66.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.67.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.68.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.69.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.69.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.70.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.71.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.72.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.73.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.74.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.75.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.76.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.76.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.77.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.78.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.79.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.80.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.81.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.82.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.83.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.83.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.84.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.85.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.86.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.87.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.88.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.89.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.90.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.90.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.91.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.92.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.93.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.94.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.95.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.96.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.97.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.97.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.98.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.99.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.100.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.101.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.102.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.103.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.104.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.104.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.105.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.106.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.107.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.108.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.109.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.110.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight": 
"model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.111.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.112.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.113.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", + 
"model.layers.40.mlp.experts.114.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.114.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.115.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.116.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.118.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.119.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.120.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight": 
"model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.121.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.122.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", + "model.layers.40.mlp.experts.123.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.124.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.125.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.126.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.127.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.128.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.129.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.130.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.131.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.132.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.133.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.134.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.135.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.135.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.136.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.137.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.138.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.139.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.140.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.141.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.142.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.143.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.144.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.145.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.145.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.146.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.147.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.149.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.150.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.151.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.152.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.153.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.154.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.155.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.156.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.157.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.158.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.gate_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.159.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.160.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.161.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.down_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.162.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.163.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.164.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.165.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.166.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.166.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.167.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.168.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.up_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.169.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.170.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.171.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.172.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.gate_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.173.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.174.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.175.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.176.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.176.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.177.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.178.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.179.down_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.180.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.181.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.182.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.up_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.183.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.184.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.185.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.186.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.187.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.188.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.189.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.gate_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.190.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.191.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.192.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.down_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.193.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.194.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.195.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.196.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.197.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.197.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.198.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.199.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.up_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.200.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.201.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.202.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.203.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.gate_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.204.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.205.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.206.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.207.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.207.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.208.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.209.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.210.down_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.211.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.212.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.213.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.up_proj.weight": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.214.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.215.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.216.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", + 
"model.layers.40.mlp.experts.217.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.218.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.219.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.220.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.gate_proj.weight_scale_inv": 
"model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", + "model.layers.40.mlp.experts.221.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.221.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.222.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.223.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.down_proj.weight": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.224.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.225.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.226.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.227.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.40.mlp.experts.228.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.228.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.229.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.230.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.up_proj.weight_scale_inv": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.231.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.232.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.233.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.234.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.gate_proj.weight": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.235.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.236.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.237.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.40.mlp.experts.238.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.238.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.239.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.240.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.241.down_proj.weight_scale_inv": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.242.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.243.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.244.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.up_proj.weight": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.245.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.246.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.247.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.40.mlp.experts.248.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.249.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.250.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.251.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.gate_proj.weight_scale_inv": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.252.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.253.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.254.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.down_proj.weight": 
"model-00106-of-000163.safetensors", + "model.layers.40.mlp.experts.255.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.q_b_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.kv_b_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.self_attn.o_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.shared_experts.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.0.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.1.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.2.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.3.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.3.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.4.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.5.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.6.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.7.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.8.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.9.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.10.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.10.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.11.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.12.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.13.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.14.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.15.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.16.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.17.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.17.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.18.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.19.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.20.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.21.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.22.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.23.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.24.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.24.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.25.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.26.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.27.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.28.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.29.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.30.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.31.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.31.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.32.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.33.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.34.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.35.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.36.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.37.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.38.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.38.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.39.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.40.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.41.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.42.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.43.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.44.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.45.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.45.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.46.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.47.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.48.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.49.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.50.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.51.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.52.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.52.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.53.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.54.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + 
"model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.55.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.56.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", + "model.layers.41.mlp.experts.57.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.58.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.59.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.59.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.60.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.61.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.62.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.63.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.64.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.65.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.66.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.66.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.67.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.68.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.69.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.70.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.71.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.72.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.73.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.73.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.74.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.75.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.76.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.77.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.78.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.79.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.80.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.80.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.81.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.82.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.83.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.84.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.85.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.86.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.87.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.87.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.88.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.89.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.90.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.91.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.92.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.93.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.94.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.94.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.95.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.96.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.97.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.98.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.99.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.100.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.101.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.101.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.102.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.103.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.up_proj.weight_scale_inv": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.104.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.105.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.106.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.107.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.108.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.109.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.110.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.111.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.111.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.112.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.113.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.114.down_proj.weight_scale_inv": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.115.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.116.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.117.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.118.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.119.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.120.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.121.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.122.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.123.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.124.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.gate_proj.weight_scale_inv": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.125.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.126.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.127.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.128.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.129.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.130.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.131.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.132.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.132.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.133.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.134.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.up_proj.weight_scale_inv": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.135.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.136.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.137.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.138.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.139.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.140.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.141.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.142.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.142.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.143.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.144.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.145.down_proj.weight_scale_inv": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.146.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.147.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.148.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight": 
"model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.149.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.150.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.151.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", + 
"model.layers.41.mlp.experts.152.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.153.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.154.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", + "model.layers.41.mlp.experts.155.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.155.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.gate_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.156.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.157.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.158.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.159.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.160.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.161.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.162.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.163.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.163.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.164.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.165.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.up_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.166.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.167.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.168.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.169.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.gate_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.170.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.171.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.172.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.173.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.173.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.174.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.175.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.176.down_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.177.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.178.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.179.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.up_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.180.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.181.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.182.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.183.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.184.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.185.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.186.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.gate_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.187.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.188.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.189.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.down_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.190.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.191.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.192.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.193.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.194.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.194.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.195.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.196.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.up_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.197.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.198.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.199.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.200.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.gate_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.201.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.202.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.203.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.204.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.204.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.205.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.206.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.207.down_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.208.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.209.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.210.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.up_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.211.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.212.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.213.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.214.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.215.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.216.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.217.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.gate_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.218.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.219.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.220.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.down_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.221.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.222.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.223.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.224.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.225.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.225.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.226.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.227.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.up_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.228.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.229.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.230.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.231.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.gate_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.232.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.233.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.234.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.235.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.235.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.236.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.237.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.238.down_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.239.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.240.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.241.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.up_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.242.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.243.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.244.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", + 
"model.layers.41.mlp.experts.245.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.246.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.247.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.248.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.gate_proj.weight_scale_inv": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.249.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.250.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.251.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.down_proj.weight": 
"model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.252.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", + "model.layers.41.mlp.experts.253.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.253.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.254.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.41.mlp.experts.255.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.41.post_attention_layernorm.weight": 
"model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.q_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_a_layernorm.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.kv_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.self_attn.o_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.shared_experts.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.0.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.0.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.1.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.2.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.3.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.4.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.5.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.6.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.7.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.7.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.8.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.9.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.10.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.11.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.12.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.13.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.14.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.14.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.15.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.16.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.17.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.18.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.19.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.20.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.21.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.21.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.22.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.23.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.24.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.25.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.26.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.27.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.28.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.28.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.29.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.30.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.31.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.32.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.33.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.34.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.35.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.35.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.36.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.37.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.38.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.39.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.40.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.41.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.42.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.42.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.43.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.44.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.45.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.46.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.47.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.48.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.49.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.49.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.50.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.51.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.52.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.53.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.54.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.55.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.56.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.56.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.57.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.58.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.59.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.60.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.61.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.62.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.63.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.63.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.64.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.65.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.66.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.67.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.68.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.69.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.70.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.70.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.71.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.72.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.73.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.74.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.75.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.76.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.77.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.77.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.78.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.79.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.80.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.81.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.82.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.83.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.84.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.84.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.85.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.86.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + 
"model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.87.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.88.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", + "model.layers.42.mlp.experts.89.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.89.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.90.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.91.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.91.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.92.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.93.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.94.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.95.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.96.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.97.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.98.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.98.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.99.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.100.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.101.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.102.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.103.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.104.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.105.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.105.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.106.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.107.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.up_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.108.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.109.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.110.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.111.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.112.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.113.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.114.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.115.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.115.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.116.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.117.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.118.down_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.119.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.120.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.121.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.122.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.123.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.124.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.125.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.126.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.127.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.128.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.gate_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.129.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.130.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.131.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.132.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.133.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.134.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.135.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.136.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.136.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.137.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.138.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.up_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.139.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.140.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.141.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.142.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.143.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.144.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.145.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.146.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.146.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.147.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.148.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.149.down_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.150.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.151.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.152.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.153.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.154.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.155.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.156.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.157.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.158.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.159.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.gate_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.160.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.161.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.162.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.down_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.163.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.164.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.165.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.166.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.167.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.167.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.168.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.169.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.up_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.170.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.171.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.172.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.173.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.gate_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.174.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.175.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.176.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", + 
"model.layers.42.mlp.experts.177.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.177.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.178.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.179.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.180.down_proj.weight_scale_inv": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.181.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.182.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.183.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.up_proj.weight": 
"model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.184.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.185.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.186.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", + "model.layers.42.mlp.experts.187.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.187.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.188.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.189.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.190.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.gate_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.191.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.192.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.193.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.down_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.194.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.195.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.196.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.197.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.198.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.198.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.199.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.200.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.up_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.201.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.202.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.203.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.204.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.gate_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.205.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.206.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.207.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.208.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.208.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.209.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.210.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.211.down_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.212.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.213.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.214.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.up_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.215.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.216.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.217.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.218.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.219.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.220.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.221.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.gate_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.222.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.223.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.224.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.down_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.225.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.226.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.227.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.228.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.229.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.229.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.230.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.231.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.up_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.232.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.233.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.234.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.235.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.gate_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.236.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.237.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.238.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.239.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.239.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.240.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.241.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.242.down_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.243.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.244.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.245.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.up_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.246.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.247.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.248.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.42.mlp.experts.249.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.250.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.251.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.252.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.gate_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.253.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.254.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.42.mlp.experts.255.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", 
+ "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.q_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.kv_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.self_attn.o_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.shared_experts.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight": 
"model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.0.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.1.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.2.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.3.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.gate_proj.weight_scale_inv": 
"model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.4.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.5.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.6.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.43.mlp.experts.7.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.8.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.9.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.10.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + 
"model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.11.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.12.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.13.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.43.mlp.experts.14.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.15.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.16.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.17.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + 
"model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.18.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.19.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.20.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", + 
"model.layers.43.mlp.experts.21.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.22.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", + "model.layers.43.mlp.experts.23.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.23.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.24.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.25.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.26.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.27.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.28.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.29.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.30.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.31.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.32.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.33.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.34.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.35.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.36.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.37.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.38.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.39.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.40.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.41.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.42.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.43.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.44.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.45.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.46.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.47.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.48.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.49.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.50.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.51.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.52.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.53.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.54.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.55.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.56.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.57.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.58.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.59.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.60.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.61.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.62.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.63.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.64.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.65.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.66.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.67.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.68.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.69.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.70.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.71.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.72.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.73.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.74.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.75.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.76.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.77.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.78.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.79.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.80.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.81.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.82.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.83.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.84.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.85.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.86.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.87.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.88.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.89.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.90.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.91.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.92.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.93.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.94.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.95.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.96.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.97.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.98.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.99.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.100.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.101.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
+ "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.102.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.103.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.104.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.105.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.106.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.107.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.108.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.gate_proj.weight_scale_inv": 
"model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.109.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.110.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.111.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight": 
"model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.112.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.113.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.114.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.115.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", + 
"model.layers.43.mlp.experts.116.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.116.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.117.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.118.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.up_proj.weight_scale_inv": 
"model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.119.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.120.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", + "model.layers.43.mlp.experts.121.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.121.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.122.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.123.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.124.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.125.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.126.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.126.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.127.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.128.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.129.down_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.130.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.131.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.132.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.133.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.134.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.135.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.136.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.137.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.138.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.139.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.gate_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.140.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.141.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.142.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.143.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.144.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.145.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.146.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.147.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.147.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.148.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.149.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.up_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.150.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.151.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.152.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.153.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.154.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.155.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.156.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.157.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.157.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.158.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.159.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.160.down_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.161.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.162.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.163.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.up_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.164.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.165.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.166.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.167.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.168.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.169.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.170.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.gate_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.171.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.172.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.173.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.down_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.174.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.175.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.176.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.177.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.178.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.178.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.179.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.180.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.up_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.181.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.182.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.183.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.184.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.gate_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.185.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.186.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.187.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.188.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.188.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.189.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.190.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.191.down_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.192.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.193.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.194.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.up_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.195.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.196.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.197.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.198.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.199.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.200.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.201.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.gate_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.202.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.203.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.204.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.down_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.205.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.206.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.207.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.208.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", + 
"model.layers.43.mlp.experts.209.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.209.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.210.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.211.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.up_proj.weight_scale_inv": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.212.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.213.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.214.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.215.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.gate_proj.weight": 
"model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.216.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.217.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", + "model.layers.43.mlp.experts.218.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.43.mlp.experts.219.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.219.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.220.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.221.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.222.down_proj.weight_scale_inv": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.223.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.224.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.225.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.up_proj.weight": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.226.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.227.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.228.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.43.mlp.experts.229.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.230.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.231.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.232.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.gate_proj.weight_scale_inv": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.233.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.234.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.235.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.down_proj.weight": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.236.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.237.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.238.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.239.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.43.mlp.experts.240.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.240.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.241.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.242.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.up_proj.weight_scale_inv": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.243.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.244.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.245.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.246.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.gate_proj.weight": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.247.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.248.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.249.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.43.mlp.experts.250.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.250.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.251.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.252.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.253.down_proj.weight_scale_inv": 
"model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.254.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.43.mlp.experts.255.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.q_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.kv_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.self_attn.o_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.shared_experts.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.0.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight": 
"model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.1.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.2.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.3.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.4.down_proj.weight_scale_inv": 
"model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.5.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.6.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.7.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.8.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.8.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.9.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.10.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.11.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.12.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.13.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.14.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.15.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.15.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.16.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.17.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.18.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.19.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.20.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.21.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.22.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.22.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.23.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.24.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.25.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.26.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.27.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.28.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.29.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.29.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.30.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.31.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.32.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.33.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.34.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.35.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.36.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.36.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.37.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.38.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.39.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.40.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.41.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.42.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.43.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.43.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.44.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.45.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.46.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.47.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.48.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.49.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.50.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.50.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.51.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.52.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.53.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + 
"model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.54.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", + "model.layers.44.mlp.experts.55.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.55.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.56.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.57.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.57.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.58.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.59.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.60.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.61.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.62.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.63.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.64.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.64.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.65.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.66.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.67.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.68.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.69.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.70.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.71.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.71.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.72.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.73.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.74.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.75.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.76.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.77.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.78.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.78.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.79.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.80.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.81.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.82.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.83.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.84.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.85.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.85.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.86.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.87.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.88.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.89.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.90.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.91.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.92.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.92.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.93.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.94.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.95.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.96.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.97.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.98.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.99.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.99.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.100.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.101.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.102.down_proj.weight_scale_inv": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.103.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.104.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.105.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.106.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.107.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.108.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.109.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.110.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.111.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.112.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.gate_proj.weight_scale_inv": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.113.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.114.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.115.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.116.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.117.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.118.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.119.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.120.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.120.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.121.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.122.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.up_proj.weight_scale_inv": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.123.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.124.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.125.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.126.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.127.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.128.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.129.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.130.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.130.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.131.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.132.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.133.down_proj.weight_scale_inv": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.134.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.135.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.136.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.137.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.138.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.139.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.140.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.141.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.142.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.143.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.gate_proj.weight_scale_inv": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.144.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.145.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.146.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight": 
"model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.147.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.148.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.149.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.150.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", + 
"model.layers.44.mlp.experts.151.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.151.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", + "model.layers.44.mlp.experts.152.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.153.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.up_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.154.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.155.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.156.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.157.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.158.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.159.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.160.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.161.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.161.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.162.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.163.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.164.down_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.165.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.166.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.167.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.up_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.168.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.169.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.170.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.171.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.172.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.173.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.174.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.gate_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.175.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.176.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.177.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.down_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.178.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.179.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.180.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.181.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.182.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.182.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.183.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.184.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.up_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.185.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.186.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.187.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.188.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.gate_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.189.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.190.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.191.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.192.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.192.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.193.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.194.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.195.down_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.196.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.197.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.198.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.up_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.199.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.200.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.201.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.202.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.203.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.204.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.205.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.gate_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.206.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.207.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.208.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.down_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.209.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.210.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.211.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.212.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.213.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.213.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.214.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.215.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.up_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.216.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.217.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.218.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.219.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.gate_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.220.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.221.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.222.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.223.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.223.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.224.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.225.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.226.down_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.227.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.228.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.229.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.up_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.230.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.231.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.232.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.233.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.234.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.235.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.236.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.gate_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.237.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.238.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.239.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.down_proj.weight": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.240.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.241.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.242.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.243.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", + 
"model.layers.44.mlp.experts.244.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.244.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.245.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.246.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.up_proj.weight_scale_inv": 
"model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.247.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.248.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.249.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", + "model.layers.44.mlp.experts.250.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.250.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.gate_proj.weight": 
"model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.251.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.252.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.253.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.44.mlp.experts.254.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.254.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.44.mlp.experts.255.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.q_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.kv_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.self_attn.o_proj.weight": 
"model-00117-of-000163.safetensors", + "model.layers.45.self_attn.o_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.shared_experts.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.0.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.2.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.3.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.4.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.5.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.5.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.6.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.7.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.8.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.9.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.10.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.11.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.12.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.12.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.13.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.14.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.15.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.16.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.17.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.18.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.19.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.19.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.20.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.21.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.22.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.23.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.24.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.25.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.26.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.26.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.27.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.28.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.29.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.30.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.31.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.32.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.33.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.33.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.34.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.35.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.36.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.37.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.38.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.39.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.40.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.40.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.41.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.42.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.43.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.44.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.45.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.46.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.47.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.47.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.48.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.49.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.50.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.51.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.52.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.53.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.54.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.54.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.55.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.56.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.57.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.58.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.59.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.60.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.61.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.61.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.62.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.63.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.64.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.65.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.66.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.67.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.68.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.68.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.69.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.70.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.71.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.72.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.73.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.74.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.75.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.75.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.76.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.77.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.78.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.79.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.80.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.81.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.82.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.82.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.83.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.84.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.85.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + 
"model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", + "model.layers.45.mlp.experts.86.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.87.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.88.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.89.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.89.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.90.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.91.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.92.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.93.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.94.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.95.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.96.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.96.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.97.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.98.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.99.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.100.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.101.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.102.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.103.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.103.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.104.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.105.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.107.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.108.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.109.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.110.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.111.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.112.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.113.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.114.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.115.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.116.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.117.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.118.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.119.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.120.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.121.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.122.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.123.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.124.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.124.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.125.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.126.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.127.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.128.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.129.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.130.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.131.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.132.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.133.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.134.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.134.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.135.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.136.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.138.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.139.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.140.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.141.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.142.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.143.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.144.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.145.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.146.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.147.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.148.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.149.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.150.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.151.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.152.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.153.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.154.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.155.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.155.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.156.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.157.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.158.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.159.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.160.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.161.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.gate_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.162.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.163.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.164.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.165.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.165.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.166.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.167.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.169.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.170.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.171.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.up_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.172.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.173.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.174.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", + 
"model.layers.45.mlp.experts.175.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.176.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.177.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.178.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.179.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.180.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.181.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.down_proj.weight": 
"model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.182.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.183.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", + "model.layers.45.mlp.experts.184.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.184.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.185.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.186.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.186.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.187.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.188.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.189.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.190.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.191.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.192.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.gate_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.193.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.194.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.195.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.196.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.196.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.197.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.198.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.200.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.201.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.202.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.up_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.203.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.204.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.205.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.206.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.207.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.208.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.209.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.210.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.211.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.212.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.down_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.213.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.214.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.215.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.216.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.217.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.217.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.218.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.219.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.220.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.221.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.222.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.223.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.gate_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.224.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.225.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.226.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.227.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.227.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.228.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.229.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.231.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.232.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.233.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.up_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.234.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.235.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.236.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.237.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.238.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.239.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.240.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.241.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.242.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.243.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.down_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.244.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.245.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.246.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.247.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.45.mlp.experts.248.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.248.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.249.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.250.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.251.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.252.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.253.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.254.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.gate_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.45.mlp.experts.255.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.q_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.kv_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.self_attn.o_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight": 
"model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.shared_experts.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.0.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.1.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.2.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.3.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.4.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.5.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.46.mlp.experts.6.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.6.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.7.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.8.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + 
"model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.9.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.10.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.11.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.12.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.46.mlp.experts.13.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.13.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.14.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.15.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + 
"model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.16.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.17.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.18.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.19.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", + 
"model.layers.46.mlp.experts.20.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", + "model.layers.46.mlp.experts.20.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.21.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.22.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.23.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.24.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.25.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.26.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.27.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.27.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.28.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.29.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.30.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.31.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.32.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.33.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.34.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.34.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.35.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.36.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.37.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.38.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.39.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.40.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.41.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.41.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.42.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.43.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.44.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.45.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.46.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.47.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.48.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.48.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.49.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.50.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.51.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.52.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.53.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.54.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.55.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.55.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.56.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.57.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.58.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.59.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.60.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.61.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.62.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.62.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.63.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.64.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.65.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.66.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.67.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.68.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.69.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.69.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.70.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.71.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.72.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.73.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.74.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.75.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.76.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.76.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.77.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.78.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.79.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.80.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.81.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.82.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.83.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.83.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.84.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.85.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.86.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.87.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.88.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.89.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.90.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.90.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.91.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.92.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.93.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.94.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.95.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.96.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.97.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.97.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.98.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.99.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.100.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.101.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.102.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.103.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.104.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.104.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.105.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.106.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.107.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.108.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.109.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.110.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight": 
"model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.111.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.112.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.113.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", + 
"model.layers.46.mlp.experts.114.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.114.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.115.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.116.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", + "model.layers.46.mlp.experts.118.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.118.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.119.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.120.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.121.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.122.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.123.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.124.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.125.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.126.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.127.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.128.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.129.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.130.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.131.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.132.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.133.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.134.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.135.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.135.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.136.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.137.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.138.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.139.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.140.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.141.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.142.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.143.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.144.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.145.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.145.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.146.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.147.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.149.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.150.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.151.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.152.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.153.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.154.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.155.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.156.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.157.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.158.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.gate_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.159.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.160.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.161.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.down_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.162.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.163.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.164.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.165.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.166.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.166.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.167.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.168.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.up_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.169.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.170.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.171.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.172.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.gate_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.173.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.174.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.175.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.176.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.176.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.177.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.178.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.179.down_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.180.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.181.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.182.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.up_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.183.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.184.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.185.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.186.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.187.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.188.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.189.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.gate_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.190.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.191.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.192.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.down_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.193.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.194.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.195.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.196.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.197.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.197.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.198.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.199.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.up_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.200.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.201.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.202.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.203.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.gate_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.204.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.205.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.206.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", + 
"model.layers.46.mlp.experts.207.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.207.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.208.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.209.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.210.down_proj.weight_scale_inv": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.211.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.212.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.213.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.up_proj.weight": 
"model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.214.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.215.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", + "model.layers.46.mlp.experts.216.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.216.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", + 
"model.layers.46.mlp.experts.217.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.218.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.219.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.220.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.gate_proj.weight_scale_inv": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.221.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.222.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.223.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.down_proj.weight": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.224.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.225.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.226.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.227.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", + 
"model.layers.46.mlp.experts.228.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.228.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.229.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.230.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.up_proj.weight_scale_inv": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.231.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.232.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.233.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.234.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.gate_proj.weight": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.235.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.236.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.237.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", + 
"model.layers.46.mlp.experts.238.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.238.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.239.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.240.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.241.down_proj.weight_scale_inv": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.242.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.243.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.244.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.up_proj.weight": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.245.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.246.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.247.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", + 
"model.layers.46.mlp.experts.248.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.249.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.250.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.251.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.gate_proj.weight_scale_inv": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.252.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.253.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.254.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.down_proj.weight": 
"model-00122-of-000163.safetensors", + "model.layers.46.mlp.experts.255.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", + "model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", + "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_a_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.q_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.kv_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.self_attn.o_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.shared_experts.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.0.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.1.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.2.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.3.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.3.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.4.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.5.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.6.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.7.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.8.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.9.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.10.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.10.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.11.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.12.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.13.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.14.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.15.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.16.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.17.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.17.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.18.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.19.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.20.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.21.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.22.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.23.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.24.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.24.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.25.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.26.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.27.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.28.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.29.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.30.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.31.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.31.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.32.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.33.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.34.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.35.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.36.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.37.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.38.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.38.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.39.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.40.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.41.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.42.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.43.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.44.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.45.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.45.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.46.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.47.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.48.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.49.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.50.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.51.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.52.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.52.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.53.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.54.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.55.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.56.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.57.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.58.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.59.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.59.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.60.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.61.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.62.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.63.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.64.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.65.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.66.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.66.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.67.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.68.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.69.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.70.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.71.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.72.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.73.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.73.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.74.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.75.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.76.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.77.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.78.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.79.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.80.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.80.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.81.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.82.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.83.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.84.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.85.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.86.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.87.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.87.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.88.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.89.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + 
"model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.90.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.91.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", + "model.layers.47.mlp.experts.92.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.92.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.93.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.94.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.94.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.95.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.96.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.97.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.98.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.99.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.100.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.101.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.101.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.102.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.103.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.up_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.104.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.105.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.106.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.107.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.108.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.109.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.110.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.111.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.111.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.112.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.113.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.114.down_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.115.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.116.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.117.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.118.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.119.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.120.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.121.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.122.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.123.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.124.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.gate_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.125.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.126.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.127.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.128.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.129.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.130.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.131.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.132.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.132.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.133.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.134.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.up_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.135.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.136.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.137.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.138.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.139.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.140.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.141.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.142.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.142.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.143.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.144.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.145.down_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.146.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.147.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.148.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.149.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.150.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.151.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.152.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.153.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.154.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.155.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.gate_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.156.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.157.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.158.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.159.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.160.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.161.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.162.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.163.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.163.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.164.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.165.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.up_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.166.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.167.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.168.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.169.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.gate_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.170.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.171.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.172.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.173.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.173.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.174.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.175.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.176.down_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.177.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.178.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.179.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.up_proj.weight": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.180.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.181.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.182.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", + 
"model.layers.47.mlp.experts.183.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.184.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.185.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.186.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.gate_proj.weight_scale_inv": 
"model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.187.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.188.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", + "model.layers.47.mlp.experts.189.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.down_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.190.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.191.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.192.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.193.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.194.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.194.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.195.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.196.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.up_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.197.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.198.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.199.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.200.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.gate_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.201.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.202.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.203.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.204.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.204.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.205.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.206.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.207.down_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.208.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.209.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.210.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.up_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.211.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.212.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.213.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.214.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.215.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.216.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.217.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.gate_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.218.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.219.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.220.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.down_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.221.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.222.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.223.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.224.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.225.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.225.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.226.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.227.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.up_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.228.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.229.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.230.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.231.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.gate_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.232.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.233.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.234.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.235.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.235.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.236.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.237.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.238.down_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.239.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.240.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.241.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.up_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.242.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.243.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.244.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.47.mlp.experts.245.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.246.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.247.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.248.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.gate_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.249.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.250.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.251.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.down_proj.weight": 
"model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.252.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.253.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.254.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.47.mlp.experts.255.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.47.post_attention_layernorm.weight": 
"model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.q_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.kv_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.self_attn.o_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.shared_experts.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.0.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.0.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.1.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.2.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.3.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.4.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.5.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.6.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.7.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.7.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.8.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.9.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.10.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.11.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.12.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.13.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.14.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.14.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.15.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.16.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.17.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.18.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.19.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.20.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.21.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.21.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.22.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.23.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + 
"model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.24.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.25.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", + "model.layers.48.mlp.experts.26.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.26.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.27.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.28.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.28.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.29.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.30.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.31.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.32.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.33.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.34.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.35.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.35.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.36.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.37.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.38.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.39.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.40.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.41.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.42.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.42.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.43.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.44.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.45.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.46.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.47.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.48.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.49.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.49.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.50.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.51.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.52.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.53.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.54.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.55.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.56.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.56.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.57.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.58.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.59.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.60.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.61.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.62.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.63.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.63.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.64.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.65.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.66.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.67.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.68.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.69.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.70.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.70.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.71.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.72.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.73.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.74.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.75.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.76.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.77.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.77.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.78.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.79.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.80.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.81.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.82.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.83.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.84.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.84.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.85.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.86.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.87.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.88.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.89.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.90.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.91.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.91.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.92.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.93.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.94.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.95.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.96.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.97.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.98.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.98.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.99.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.100.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.101.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.102.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.103.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.104.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.105.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.105.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.106.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.107.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.up_proj.weight_scale_inv": 
"model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.108.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.109.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.110.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.111.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight": 
"model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.112.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.113.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.114.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", + 
"model.layers.48.mlp.experts.115.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.115.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.116.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.117.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.118.down_proj.weight_scale_inv": 
"model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.119.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.120.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.121.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight": 
"model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.122.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", + "model.layers.48.mlp.experts.123.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.124.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.125.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.126.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.127.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.128.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.gate_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.129.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.130.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.131.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.132.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.133.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.134.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.135.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.136.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.136.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.137.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.138.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.up_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.139.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.140.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.141.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.142.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.143.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.144.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.145.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.146.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.146.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.147.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.148.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.149.down_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.150.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.151.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.152.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.153.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.154.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.155.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.156.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.157.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.158.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.159.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.gate_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.160.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.161.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.162.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.down_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.163.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.164.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.165.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.166.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.167.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.167.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.168.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.169.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.up_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.170.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.171.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.172.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.173.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.gate_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.174.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.175.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.176.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.177.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.177.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.178.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.179.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.180.down_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.181.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.182.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.183.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.up_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.184.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.185.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.186.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.187.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.188.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.189.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.190.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.gate_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.191.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.192.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.193.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.down_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.194.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.195.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.196.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.197.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.198.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.198.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.199.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.200.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.up_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.201.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.202.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.203.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.204.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.gate_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.205.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.206.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.207.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.208.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.208.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.209.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.210.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.211.down_proj.weight_scale_inv": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.212.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.213.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.214.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.up_proj.weight": 
"model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.215.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.216.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.217.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", + 
"model.layers.48.mlp.experts.218.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.219.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.220.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", + "model.layers.48.mlp.experts.221.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.221.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.gate_proj.weight_scale_inv": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.222.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.223.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.224.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.down_proj.weight": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.225.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.226.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.227.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.228.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.48.mlp.experts.229.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.229.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.230.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.231.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.up_proj.weight_scale_inv": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.232.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.233.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.234.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.235.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.gate_proj.weight": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.236.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.237.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.238.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.48.mlp.experts.239.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.239.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.240.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.241.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.242.down_proj.weight_scale_inv": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.243.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.244.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.245.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.up_proj.weight": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.246.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.247.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.248.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.48.mlp.experts.249.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.250.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.251.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.252.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.gate_proj.weight_scale_inv": 
"model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.253.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.254.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.48.mlp.experts.255.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", 
+ "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.q_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.kv_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.self_attn.o_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.shared_experts.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight": 
"model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.0.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.1.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.2.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.3.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.gate_proj.weight_scale_inv": 
"model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.4.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.5.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.6.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.7.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.8.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.9.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.10.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.11.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.12.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.13.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.14.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.15.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.16.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.17.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.18.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.19.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.20.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.21.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.22.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.23.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.24.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.25.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.26.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.27.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.28.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.29.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.30.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.31.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.32.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.33.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.34.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.35.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.36.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.37.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.38.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.39.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.40.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.41.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.42.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.43.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.44.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.45.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.46.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.47.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.48.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.49.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.50.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.51.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.52.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.53.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.54.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.55.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", + 
"model.layers.49.mlp.experts.56.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", + "model.layers.49.mlp.experts.57.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.58.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.59.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.60.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.61.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.62.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.63.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.64.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.65.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.66.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.67.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.68.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.69.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.70.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.71.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.72.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.73.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.74.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.75.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.76.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.77.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.78.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.79.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.80.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.81.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.82.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.83.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.84.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.85.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.86.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.87.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.88.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.89.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.90.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.91.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.92.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.93.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.94.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.95.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.96.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.97.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.98.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.99.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.100.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.101.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
+ "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.102.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.103.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.104.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.105.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.106.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.107.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.108.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.gate_proj.weight_scale_inv": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.109.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.110.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.111.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.112.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.113.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.114.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.115.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.116.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.116.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.117.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.118.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.up_proj.weight_scale_inv": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.119.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.120.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.121.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.122.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.123.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.124.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.125.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.126.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.126.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.127.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.128.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.129.down_proj.weight_scale_inv": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.130.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.131.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.132.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.133.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.134.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.135.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.136.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.137.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.138.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.139.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.gate_proj.weight_scale_inv": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.140.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.141.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.142.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.143.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.144.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.145.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.146.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", + 
"model.layers.49.mlp.experts.147.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.147.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.148.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.149.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.up_proj.weight_scale_inv": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.150.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.151.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.152.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.153.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight": 
"model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.154.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", + "model.layers.49.mlp.experts.155.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.155.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.156.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.157.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.157.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.158.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.159.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.160.down_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.161.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.162.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.163.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.up_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.164.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.165.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.166.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.167.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.168.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.169.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.170.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.gate_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.171.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.172.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.173.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.down_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.174.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.175.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.176.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.177.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.178.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.178.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.179.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.180.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.up_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.181.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.182.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.183.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.184.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.gate_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.185.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.186.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.187.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.188.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.188.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.189.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.190.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.191.down_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.192.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.193.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.194.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.up_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.195.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.196.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.197.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.198.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.199.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.200.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.201.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.gate_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.202.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.203.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.204.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.down_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.205.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.206.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.207.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.208.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.209.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.209.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.210.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.211.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.up_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.212.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.213.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.214.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.215.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.gate_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.216.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.217.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.218.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.219.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.219.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.220.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.221.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.222.down_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.223.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.224.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.225.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.up_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.226.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.227.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.228.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.229.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.230.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.231.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.232.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.gate_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.233.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.234.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.235.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.down_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.236.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.237.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.238.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.239.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.240.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.240.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.241.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.242.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.up_proj.weight_scale_inv": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.243.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.244.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.245.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.246.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.gate_proj.weight": 
"model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.247.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.248.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.249.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", + 
"model.layers.49.mlp.experts.250.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.250.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.251.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.252.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", + "model.layers.49.mlp.experts.253.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.253.down_proj.weight_scale_inv": 
"model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.254.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.49.mlp.experts.255.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.q_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.kv_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.self_attn.o_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.shared_experts.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.0.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight": 
"model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.1.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.2.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.3.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.4.down_proj.weight_scale_inv": 
"model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.5.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.6.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.7.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.8.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.8.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.9.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.10.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.11.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.12.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.13.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.14.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.15.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.15.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.16.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.17.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.18.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.19.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.20.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.21.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.22.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.22.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.23.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.24.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.25.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.26.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.27.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.28.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.29.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.29.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.30.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.31.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.32.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.33.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.34.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.35.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.36.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.36.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.37.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.38.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.39.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.40.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.41.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.42.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.43.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.43.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.44.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.45.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.46.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.47.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.48.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.49.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.50.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.50.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.51.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.52.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.53.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.54.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.55.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.56.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.57.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.57.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.58.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.59.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.60.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.61.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.62.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.63.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.64.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.64.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.65.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.66.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.67.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.68.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.69.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.70.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.71.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.71.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.72.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.73.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.74.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.75.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.76.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.77.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.78.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.78.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.79.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.80.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.81.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.82.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.83.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.84.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.85.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.85.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.86.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.87.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.88.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + 
"model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", + "model.layers.50.mlp.experts.89.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.89.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.90.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.91.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.92.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.92.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.93.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.94.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.95.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.96.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.97.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.98.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.99.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.99.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.100.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.101.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.102.down_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.103.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.104.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.105.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.106.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.107.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.108.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.109.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.110.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.111.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.112.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.gate_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.113.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.114.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.115.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.116.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.117.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.118.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.119.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.120.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.120.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.121.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.122.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.up_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.123.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.124.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.125.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.126.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.127.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.128.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.129.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.130.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.130.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.131.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.132.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.133.down_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.134.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.135.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.136.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.137.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.138.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.139.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.140.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.141.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.142.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.143.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.gate_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.144.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.145.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.146.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.147.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.148.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.149.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.150.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.151.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.151.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.152.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.153.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.up_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.154.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.155.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.156.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.157.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.158.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.159.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.160.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.161.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.161.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.162.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.163.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.164.down_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.165.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.166.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.167.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.up_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.168.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.169.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.170.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.171.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.172.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.173.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.174.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.gate_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.175.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.176.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.177.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.down_proj.weight": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.178.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.179.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.180.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.181.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", + 
"model.layers.50.mlp.experts.182.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.182.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.183.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.184.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.up_proj.weight_scale_inv": 
"model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.185.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.186.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", + "model.layers.50.mlp.experts.187.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.187.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.188.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.gate_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.189.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.190.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.191.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.192.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.192.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.193.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.194.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.195.down_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.196.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.197.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.198.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.up_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.199.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.200.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.201.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.202.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.203.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.204.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.205.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.gate_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.206.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.207.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.208.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.down_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.209.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.210.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.211.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.212.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.213.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.213.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.214.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.215.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.up_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.216.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.217.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.218.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.219.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.gate_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.220.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.221.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.222.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.223.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.223.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.224.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.225.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.226.down_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.227.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.228.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.229.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.up_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.230.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.231.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.232.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.233.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.234.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.235.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.236.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.gate_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.237.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.238.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.239.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.down_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.240.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.241.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.242.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.243.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.244.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.244.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.245.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.246.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.up_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.247.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.248.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.249.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.250.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.gate_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.251.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.252.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.253.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.50.mlp.experts.254.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.254.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.50.mlp.experts.255.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.q_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.kv_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.self_attn.o_proj.weight": 
"model-00133-of-000163.safetensors", + "model.layers.51.self_attn.o_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.shared_experts.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.0.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.2.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.3.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.4.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.5.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.5.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.6.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.7.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.8.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.9.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.10.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.11.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.12.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.12.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.13.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.14.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.15.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.16.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.17.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.18.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.19.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.19.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.20.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.21.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.22.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + 
"model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", + "model.layers.51.mlp.experts.23.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.23.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.24.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.25.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.26.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.26.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.27.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.28.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.29.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.30.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.31.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.32.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.33.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.33.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.34.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.35.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.36.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.37.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.38.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.39.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.40.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.40.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.41.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.42.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.43.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.44.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.45.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.46.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.47.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.47.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.48.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.49.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.50.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.51.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.52.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.53.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.54.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.54.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.55.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.56.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.57.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.58.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.59.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.60.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.61.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.61.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.62.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.63.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.64.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.65.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.66.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.67.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.68.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.68.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.69.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.70.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.71.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.72.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.73.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.74.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.75.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.75.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.76.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.77.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.78.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.79.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.80.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.81.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.82.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.82.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.83.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.84.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.85.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.86.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.87.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.88.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.89.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.89.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.90.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.91.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.92.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.93.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.94.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.95.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.96.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.96.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.97.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.98.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.99.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.100.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.101.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.102.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.103.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.103.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.104.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.105.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.107.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.108.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.109.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight": 
"model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.110.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.111.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.112.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", + 
"model.layers.51.mlp.experts.113.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.114.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.115.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.116.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.117.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.118.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.119.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight": 
"model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.120.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", + "model.layers.51.mlp.experts.121.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.121.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.122.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.123.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.124.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.124.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.125.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.126.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.127.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.128.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.129.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.130.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.131.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.132.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.133.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.134.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.134.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.135.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.136.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.138.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.139.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.140.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.141.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.142.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.143.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.144.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.145.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.146.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.147.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.148.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.149.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.150.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.151.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.152.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.153.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.154.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.155.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.155.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.156.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.157.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.158.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.159.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.160.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.161.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.gate_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.162.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.163.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.164.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.165.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.165.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.166.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.167.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.169.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.170.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.171.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.up_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.172.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.173.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.174.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.175.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.176.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.177.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.178.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.179.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.180.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.181.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.down_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.182.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.183.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.184.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.185.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.186.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.186.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.187.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.188.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.189.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.190.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.191.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.192.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.gate_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.193.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.194.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.195.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.196.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.196.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.197.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.198.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.200.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.201.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.202.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.up_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.203.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.204.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.205.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.206.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.207.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.208.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.209.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.210.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.211.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.212.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.down_proj.weight": 
"model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.213.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.214.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.215.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.216.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", + 
"model.layers.51.mlp.experts.217.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.217.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", + "model.layers.51.mlp.experts.218.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.219.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.220.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.221.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.222.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.223.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.gate_proj.weight": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.224.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.225.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.226.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.51.mlp.experts.227.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.227.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.228.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.229.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.231.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.232.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.233.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.up_proj.weight": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.234.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.235.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.236.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.51.mlp.experts.237.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.238.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.239.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.240.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.241.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.242.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.243.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.down_proj.weight": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.244.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.245.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.246.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.247.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.51.mlp.experts.248.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.248.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.249.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.250.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.251.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.252.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.253.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.254.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.gate_proj.weight": 
"model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.51.mlp.experts.255.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.q_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.kv_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.self_attn.o_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight": 
"model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.shared_experts.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.0.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.1.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.2.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.3.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.4.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.5.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.6.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.6.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.7.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.8.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.9.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.10.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.11.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.12.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.13.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.13.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.14.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.15.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.16.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.17.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.18.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.19.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.20.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.20.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.21.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.22.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.23.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.24.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.25.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.26.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.27.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.27.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.28.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.29.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.30.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.31.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.32.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.33.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.34.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.34.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.35.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.36.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.37.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.38.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.39.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.40.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.41.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.41.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.42.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.43.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.44.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.45.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.46.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.47.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.48.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.48.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.49.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.50.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.51.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.52.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.53.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.54.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", + "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", + 
"model.layers.52.mlp.experts.55.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.55.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.56.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.57.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.58.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.59.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.60.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.61.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.62.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.62.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.63.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.64.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.65.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.66.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.67.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.68.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.69.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.69.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.70.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.71.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.72.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.73.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.74.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.75.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.76.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.76.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.77.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.78.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.79.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.80.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.81.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.82.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.83.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.83.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.84.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.85.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.86.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.87.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.88.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.89.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.90.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.90.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.91.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.92.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.93.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.94.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.95.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.96.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.97.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.97.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.98.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.99.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.100.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.101.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.102.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.103.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.104.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.104.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.105.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.106.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.107.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.108.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.109.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.110.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.111.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.112.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.113.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.114.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.114.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.115.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.116.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.118.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.119.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.120.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.121.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.122.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.123.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.124.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.125.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.126.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.127.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.128.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.129.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.130.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.131.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.132.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.133.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.134.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.135.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.135.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.136.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.137.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.138.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.139.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.140.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.141.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.142.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.143.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.144.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", + 
"model.layers.52.mlp.experts.145.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.145.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.146.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.147.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.149.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.150.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.151.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight": 
"model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", + "model.layers.52.mlp.experts.152.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.153.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.154.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.155.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.156.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.157.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.158.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.gate_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.159.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.160.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.161.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.down_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.162.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.163.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.164.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.165.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.166.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.166.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.167.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.168.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.up_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.169.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.170.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.171.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.172.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.gate_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.173.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.174.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.175.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.176.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.176.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.177.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.178.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.179.down_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.180.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.181.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.182.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.up_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.183.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.184.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.185.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.186.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.187.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.188.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.189.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.gate_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.190.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.191.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.192.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.down_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.193.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.194.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.195.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.196.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.197.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.197.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.198.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.199.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.up_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.200.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.201.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.202.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.203.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.gate_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.204.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.205.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.206.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.207.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.207.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.208.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.209.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.210.down_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.211.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.212.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.213.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.up_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.214.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.215.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.216.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.217.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.218.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.219.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.220.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.gate_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.221.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.222.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.223.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.down_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.224.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.225.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.226.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.227.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.228.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.228.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.229.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.230.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.up_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.231.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.232.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.233.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.234.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.gate_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.235.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.236.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.237.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.238.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.238.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.239.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.240.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.241.down_proj.weight_scale_inv": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.242.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.243.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.244.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.up_proj.weight": 
"model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.245.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.246.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.247.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", + 
"model.layers.52.mlp.experts.248.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.249.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", + "model.layers.52.mlp.experts.250.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.250.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.251.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.gate_proj.weight_scale_inv": 
"model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.252.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.253.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.254.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.down_proj.weight": 
"model-00139-of-000163.safetensors", + "model.layers.52.mlp.experts.255.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.q_b_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.kv_b_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.self_attn.o_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.shared_experts.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.0.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.1.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.2.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.3.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.3.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.4.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.5.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.6.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.7.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.8.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.9.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.10.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.10.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.11.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.12.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.13.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.14.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.15.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.16.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.17.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.17.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.18.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.19.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.20.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.21.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.22.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.23.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.24.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.24.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.25.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.26.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.27.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.28.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.29.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.30.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.31.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.31.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.32.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.33.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.34.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.35.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.36.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.37.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.38.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.38.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.39.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.40.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.41.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.42.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.43.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.44.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.45.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.45.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.46.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.47.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.48.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.49.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.50.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.51.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.52.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.52.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.53.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.54.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.55.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.56.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.57.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.58.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.59.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.59.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.60.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.61.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.62.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.63.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.64.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.65.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.66.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.66.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.67.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.68.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.69.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.70.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.71.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.72.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.73.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.73.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.74.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.75.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.76.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.77.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.78.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.79.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.80.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.80.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.81.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.82.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + 
"model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.83.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.84.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.85.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", + "model.layers.53.mlp.experts.86.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.87.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.87.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.88.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.89.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.90.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.91.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.92.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.93.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.94.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.94.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.95.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.96.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.97.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.98.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.99.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.100.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.101.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.101.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.102.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.103.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.up_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.104.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.105.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.106.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.107.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.108.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.109.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.110.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.111.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.111.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.112.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.113.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.114.down_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.115.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.116.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.117.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.118.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.119.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.120.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.121.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.122.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.123.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.124.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.gate_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.125.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.126.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.127.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.128.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.129.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.130.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.131.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.132.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.132.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.133.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.134.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.up_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.135.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.136.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.137.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.138.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.139.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.140.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.141.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.142.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.142.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.143.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.144.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.145.down_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.146.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.147.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.148.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.149.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.150.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.151.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.152.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.153.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.154.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.155.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.gate_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.156.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.157.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.158.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.159.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.160.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.161.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.162.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.163.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.163.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.164.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.165.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.up_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.166.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.167.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.168.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.169.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.gate_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.170.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.171.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.172.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.173.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.173.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.174.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.175.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.176.down_proj.weight_scale_inv": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.177.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.178.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.179.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.up_proj.weight": 
"model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.180.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.181.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.182.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", + 
"model.layers.53.mlp.experts.183.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", + "model.layers.53.mlp.experts.184.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.184.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.185.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.186.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.gate_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.187.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.188.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.189.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.down_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.190.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.191.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.192.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.193.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.194.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.194.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.195.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.196.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.up_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.197.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.198.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.199.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.200.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.gate_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.201.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.202.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.203.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.204.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.204.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.205.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.206.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.207.down_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.208.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.209.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.210.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.up_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.211.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.212.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.213.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.214.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.215.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.216.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.217.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.gate_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.218.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.219.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.220.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.down_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.221.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.222.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.223.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.224.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.225.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.225.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.226.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.227.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.up_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.228.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.229.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.230.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.231.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.gate_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.232.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.233.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.234.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.235.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.235.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.236.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.237.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.238.down_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.239.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.240.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.241.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.up_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.242.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.243.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.244.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", + 
"model.layers.53.mlp.experts.245.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.246.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.247.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.248.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.gate_proj.weight_scale_inv": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.249.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.250.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.251.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.down_proj.weight": 
"model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.252.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.253.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.254.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", + "model.layers.53.mlp.experts.255.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", + "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", + "model.layers.53.post_attention_layernorm.weight": 
"model-00141-of-000163.safetensors", + "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_a_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.q_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_a_layernorm.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.kv_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.self_attn.o_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.shared_experts.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.0.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.0.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.1.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.2.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.3.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.4.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.5.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.6.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.7.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.7.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.8.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.9.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.10.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.11.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.12.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.13.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.14.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.14.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.15.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.16.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.17.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.18.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.19.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.20.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.21.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.21.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.22.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.23.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.24.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.25.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.26.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.27.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.28.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.28.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.29.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.30.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.31.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.32.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.33.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.34.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.35.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.35.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.36.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.37.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.38.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.39.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.40.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.41.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.42.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.42.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.43.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.44.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.45.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.46.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.47.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.48.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.49.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.49.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.50.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.51.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.52.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.53.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.54.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.55.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.56.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.56.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.57.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.58.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.59.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.60.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.61.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.62.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.63.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.63.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.64.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.65.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.66.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.67.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.68.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.69.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.70.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.70.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.71.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.72.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.73.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.74.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.75.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.76.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.77.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.77.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.78.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.79.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.80.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.81.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.82.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.83.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.84.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.84.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.85.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.86.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.87.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.88.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.89.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.90.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", + 
"model.layers.54.mlp.experts.91.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.91.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", + "model.layers.54.mlp.experts.92.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.92.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.93.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.94.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.95.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.96.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.97.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.98.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.98.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.99.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.100.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.101.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.102.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.103.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.104.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.105.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.105.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.106.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.107.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.up_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.108.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.109.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.110.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.111.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.112.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.113.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.114.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.115.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.115.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.116.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.117.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.118.down_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.119.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.120.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.121.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.122.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.123.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.124.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.125.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.126.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.127.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.128.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.gate_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.129.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.130.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.131.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.132.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.133.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.134.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.135.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.136.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.136.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.137.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.138.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.up_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.139.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.140.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.141.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.142.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.143.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.144.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.145.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.146.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.146.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.147.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.148.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.149.down_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.150.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.151.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.152.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.153.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.154.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.155.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.156.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.157.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.158.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.159.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.gate_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.160.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.161.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.162.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.down_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.163.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.164.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.165.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.166.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.167.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.167.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.168.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.169.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.up_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.170.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.171.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.172.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.173.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.gate_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.174.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.175.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.176.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.177.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.177.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.178.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.179.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.180.down_proj.weight_scale_inv": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.181.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.182.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.183.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.up_proj.weight": 
"model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.184.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.185.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.186.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", + 
"model.layers.54.mlp.experts.187.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.188.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", + "model.layers.54.mlp.experts.189.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.190.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.gate_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.191.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.192.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.193.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.down_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.194.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.195.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.196.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.197.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.198.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.198.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.199.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.200.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.up_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.201.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.202.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.203.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.204.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.gate_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.205.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.206.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.207.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.208.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.208.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.209.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.210.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.211.down_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.212.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.213.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.214.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.up_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.215.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.216.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.217.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.218.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.219.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.220.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.221.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.gate_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.222.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.223.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.224.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.down_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.225.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.226.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.227.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.228.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.229.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.229.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.230.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.231.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.up_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.232.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.233.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.234.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.235.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.gate_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.236.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.237.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.238.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.239.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.239.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.240.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.241.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.242.down_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.243.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.244.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.245.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.up_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.246.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.247.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.248.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.54.mlp.experts.249.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.250.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.251.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.252.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.gate_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.253.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.254.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.54.mlp.experts.255.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", 
+ "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.q_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.kv_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.self_attn.o_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.shared_experts.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight": 
"model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.0.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.1.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.2.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.3.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.gate_proj.weight_scale_inv": 
"model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.4.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.5.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.6.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.7.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.8.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.9.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.10.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.11.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.12.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.13.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.14.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.15.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.16.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.17.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.18.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.19.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.20.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.21.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.22.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.23.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.24.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + 
"model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.25.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", + "model.layers.55.mlp.experts.26.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.26.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.27.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.28.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.29.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.30.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.31.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.32.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.33.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.34.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.35.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.36.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.37.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.38.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.39.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.40.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.41.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.42.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.43.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.44.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.45.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.46.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.47.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.48.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.49.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.50.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.51.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.52.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.53.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.54.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.55.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.56.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.57.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.58.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.59.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.60.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.61.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.62.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.63.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.64.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.65.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.66.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.67.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.68.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.69.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.70.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.71.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.72.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.73.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.74.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.75.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.76.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.77.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.78.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.79.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.80.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.81.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.82.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.83.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.84.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.85.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.86.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.87.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.88.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.89.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.90.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.91.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.92.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.93.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.94.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.95.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.96.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.97.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.98.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.99.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.100.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.101.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
+ "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.102.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.103.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.104.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.105.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.106.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.107.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.108.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.gate_proj.weight_scale_inv": 
"model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.109.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.110.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.111.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight": 
"model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.112.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.113.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.114.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.115.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", + 
"model.layers.55.mlp.experts.116.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.116.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.117.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.118.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.up_proj.weight_scale_inv": 
"model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.119.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.120.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.121.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.122.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight": 
"model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", + "model.layers.55.mlp.experts.123.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.124.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.125.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.126.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.126.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.127.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.128.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.129.down_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.130.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.131.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.132.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.133.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.134.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.135.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.136.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.137.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.138.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.139.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.gate_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.140.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.141.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.142.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.143.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.144.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.145.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.146.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.147.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.147.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.148.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.149.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.up_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.150.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.151.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.152.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.153.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.154.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.155.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.156.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.157.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.157.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.158.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.159.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.160.down_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.161.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.162.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.163.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.up_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.164.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.165.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.166.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.167.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.168.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.169.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.170.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.gate_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.171.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.172.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.173.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.down_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.174.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.175.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.176.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.177.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.178.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.178.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.179.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.180.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.up_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.181.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.182.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.183.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.184.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.gate_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.185.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.186.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.187.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.188.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.188.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.189.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.190.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.191.down_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.192.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.193.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.194.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.up_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.195.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.196.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.197.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.198.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.199.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.200.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.201.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.gate_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.202.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.203.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.204.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.down_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.205.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.206.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.207.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.208.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.209.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.209.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.210.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.211.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.up_proj.weight_scale_inv": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.212.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.213.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.214.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.215.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.gate_proj.weight": 
"model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.216.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.217.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.218.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", + 
"model.layers.55.mlp.experts.219.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.219.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.220.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", + "model.layers.55.mlp.experts.221.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.221.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.222.down_proj.weight_scale_inv": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.223.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.224.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.225.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.up_proj.weight": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.226.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.227.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.228.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.55.mlp.experts.229.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.230.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.231.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.232.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.gate_proj.weight_scale_inv": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.233.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.234.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.235.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.down_proj.weight": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.236.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.237.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.238.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.239.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.55.mlp.experts.240.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.240.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.241.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.242.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.up_proj.weight_scale_inv": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.243.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.244.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.245.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.246.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.gate_proj.weight": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.247.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.248.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.249.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.55.mlp.experts.250.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.250.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.251.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.252.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.253.down_proj.weight_scale_inv": 
"model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.254.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.55.mlp.experts.255.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.q_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.kv_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.self_attn.o_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.shared_experts.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.0.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight": 
"model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.1.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.2.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.3.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.4.down_proj.weight_scale_inv": 
"model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.5.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.6.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.7.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.8.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.8.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.9.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.10.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.11.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.12.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.13.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.14.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.15.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.15.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.16.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.17.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.18.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.19.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.20.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.21.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.22.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.22.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.23.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.24.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.25.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.26.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.27.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.28.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.29.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.29.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.30.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.31.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.32.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.33.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.34.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.35.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.36.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.36.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.37.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.38.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.39.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.40.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.41.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.42.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.43.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.43.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.44.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.45.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.46.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.47.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.48.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.49.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.50.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.50.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.51.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.52.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.53.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.54.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.55.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.56.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", + 
"model.layers.56.mlp.experts.57.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", + "model.layers.56.mlp.experts.57.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.58.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.59.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.60.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.61.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.62.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.63.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.64.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.64.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.65.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.66.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.67.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.68.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.69.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.70.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.71.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.71.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.72.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.73.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.74.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.75.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.76.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.77.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.78.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.78.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.79.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.80.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.81.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.82.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.83.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.84.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.85.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.85.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.86.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.87.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.88.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.89.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.90.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.91.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.92.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.92.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.93.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.94.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.95.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.96.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.97.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.98.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.99.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.99.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.100.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.101.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.102.down_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.103.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.104.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.105.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.106.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.107.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.108.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.109.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.110.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.111.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.112.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.gate_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.113.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.114.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.115.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.116.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.117.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.118.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.119.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.120.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.120.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.121.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.122.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.up_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.123.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.124.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.125.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.126.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.127.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.128.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.129.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.130.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.130.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.131.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.132.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.133.down_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.134.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.135.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.136.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.137.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.138.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.139.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.140.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.141.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.142.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.143.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.gate_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.144.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.145.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.146.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.147.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.148.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.149.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.150.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", + 
"model.layers.56.mlp.experts.151.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.151.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.152.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.153.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.up_proj.weight_scale_inv": 
"model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.154.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", + "model.layers.56.mlp.experts.155.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.155.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.156.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.157.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.158.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.159.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.160.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.161.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.161.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.162.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.163.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.164.down_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.165.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.166.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.167.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.up_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.168.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.169.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.170.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.171.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.172.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.173.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.174.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.gate_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.175.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.176.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.177.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.down_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.178.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.179.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.180.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.181.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.182.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.182.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.183.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.184.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.up_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.185.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.186.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.187.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.188.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.gate_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.189.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.190.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.191.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.192.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.192.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.193.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.194.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.195.down_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.196.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.197.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.198.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.up_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.199.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.200.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.201.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.202.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.203.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.204.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.205.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.gate_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.206.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.207.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.208.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.down_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.209.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.210.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.211.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.212.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.213.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.213.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.214.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.215.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.up_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.216.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.217.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.218.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.219.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.gate_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.220.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.221.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.222.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.223.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.223.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.224.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.225.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.226.down_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.227.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.228.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.229.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.up_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.230.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.231.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.232.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.233.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.234.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.235.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.236.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.gate_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.237.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.238.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.239.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.down_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.240.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.241.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.242.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.243.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", + 
"model.layers.56.mlp.experts.244.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.244.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.245.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.246.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.up_proj.weight_scale_inv": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.247.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.248.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.249.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.250.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.gate_proj.weight": 
"model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.251.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.252.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", + "model.layers.56.mlp.experts.253.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.253.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.56.mlp.experts.254.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.254.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.56.mlp.experts.255.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.q_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.kv_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.self_attn.o_proj.weight": 
"model-00150-of-000163.safetensors", + "model.layers.57.self_attn.o_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.shared_experts.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.0.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.2.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.3.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.4.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.5.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.5.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.6.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.7.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.8.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.9.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.10.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.11.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.12.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.12.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.13.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.14.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.15.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.16.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.17.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.18.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.19.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.19.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.20.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.21.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.22.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.23.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.24.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.25.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.26.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.26.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.27.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.28.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.29.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.30.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.31.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.32.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.33.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.33.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.34.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.35.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.36.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.37.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.38.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.39.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.40.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.40.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.41.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.42.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.43.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.44.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.45.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.46.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.47.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.47.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.48.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.49.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.50.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.51.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.52.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.53.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.54.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.54.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.55.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.56.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.57.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.58.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.59.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.60.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.61.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.61.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.62.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.63.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.64.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.65.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.66.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.67.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.68.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.68.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.69.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.70.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.71.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.72.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.73.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.74.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.75.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.75.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.76.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.77.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.78.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.79.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.80.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.81.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.82.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.82.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.83.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.84.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.85.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.86.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.87.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.88.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", + "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", + 
"model.layers.57.mlp.experts.89.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.89.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.90.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.91.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.92.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.93.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.94.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.95.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.96.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.96.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.97.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.98.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.99.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.100.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.101.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.102.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.103.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.103.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.104.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.105.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.106.down_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.107.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.108.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.109.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.110.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.111.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.112.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.113.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.114.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.115.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.116.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.gate_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.117.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.118.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.119.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.120.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.121.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.122.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.123.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.124.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.124.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.125.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.126.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.up_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.127.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.128.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.129.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.130.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.131.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.132.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.133.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.134.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.134.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.135.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.136.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.137.down_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.138.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.139.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.140.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.141.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.142.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.143.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.144.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.145.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.146.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.147.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.gate_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.148.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.149.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.150.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.151.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.152.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.153.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.154.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.155.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.155.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.156.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.157.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.up_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.158.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.159.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.160.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.161.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.gate_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.162.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.163.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.164.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.165.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.165.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.166.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.167.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.168.down_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.169.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.170.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.171.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.up_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.172.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.173.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.174.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.175.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.176.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.177.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.178.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.gate_proj.weight_scale_inv": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.179.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.180.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.181.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.down_proj.weight": 
"model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.182.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.183.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.184.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.185.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", + 
"model.layers.57.mlp.experts.186.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.186.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", + "model.layers.57.mlp.experts.187.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.187.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.188.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.up_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.189.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.190.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.191.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.192.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.gate_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.193.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.194.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.195.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.196.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.196.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.197.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.198.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.199.down_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.200.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.201.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.202.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.up_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.203.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.204.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.205.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.206.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.207.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.208.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.209.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.gate_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.210.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.211.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.212.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.down_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.213.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.214.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.215.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.216.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.217.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.217.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.218.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.219.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.up_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.220.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.221.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.222.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.223.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.gate_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.224.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.225.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.226.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.227.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.227.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.228.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.229.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.230.down_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.231.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.232.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.233.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.up_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.234.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.235.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.236.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.237.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.238.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.239.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.240.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.gate_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.241.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.242.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.243.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.down_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.244.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.245.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.246.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.247.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.57.mlp.experts.248.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.248.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.249.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.250.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.up_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.251.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.252.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.253.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.254.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.gate_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.57.mlp.experts.255.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.q_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.kv_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.self_attn.o_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight": 
"model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.shared_experts.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.0.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.1.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.up_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.2.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.3.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.4.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.5.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.58.mlp.experts.6.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.6.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.7.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.8.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + 
"model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.9.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.10.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.11.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.12.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.58.mlp.experts.13.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.13.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.14.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.15.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + 
"model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.16.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.17.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.18.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.19.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", + 
"model.layers.58.mlp.experts.20.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.20.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.21.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.22.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", + "model.layers.58.mlp.experts.23.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.23.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.24.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.25.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.26.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.27.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.27.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.28.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.29.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.30.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.31.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.32.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.33.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.34.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.34.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.35.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.36.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.37.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.38.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.39.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.40.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.41.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.41.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.42.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.43.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.44.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.45.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.46.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.47.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.48.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.48.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.49.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.50.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.51.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.52.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.53.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.54.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.55.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.55.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.56.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.57.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.58.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.59.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.60.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.61.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.62.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.62.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.63.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.64.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.65.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.66.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.67.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.68.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.69.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.69.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.70.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.71.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.72.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.73.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.74.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.75.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.76.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.76.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.77.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.78.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.79.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.80.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.81.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.82.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.83.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.83.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.84.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.85.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.86.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.87.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.88.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.89.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.90.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.90.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.91.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.92.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.93.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.94.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.95.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.96.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.97.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.97.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.98.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.99.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.100.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.101.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.102.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.103.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.104.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.104.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.105.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.106.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.up_proj.weight_scale_inv": 
"model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.107.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.108.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.109.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.110.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight": 
"model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.111.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.112.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.113.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", + 
"model.layers.58.mlp.experts.114.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.114.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.115.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.116.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.117.down_proj.weight_scale_inv": 
"model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.118.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.119.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.120.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", + "model.layers.58.mlp.experts.121.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.121.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.122.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.123.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.124.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.125.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.126.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.127.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.gate_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.128.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.129.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.130.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.131.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.132.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.133.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.134.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.135.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.135.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.136.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.137.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.up_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.138.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.139.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.140.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.141.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.142.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.143.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.144.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.145.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.145.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.146.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.147.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.148.down_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.149.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.150.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.151.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.152.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.153.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.154.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.155.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.156.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.157.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.158.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.gate_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.159.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.160.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.161.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.down_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.162.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.163.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.164.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.165.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.166.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.166.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.167.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.168.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.up_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.169.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.170.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.171.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.172.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.gate_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.173.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.174.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.175.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.176.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.176.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.177.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.178.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.179.down_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.180.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.181.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.182.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.up_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.183.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.184.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.185.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.186.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.187.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.188.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.189.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.gate_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.190.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.191.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.192.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.down_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.193.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.194.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.195.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.196.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.197.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.197.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.198.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.199.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.up_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.200.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.201.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.202.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.203.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.gate_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.204.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.205.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.206.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.207.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.207.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.208.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.209.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.210.down_proj.weight_scale_inv": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.211.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.212.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.213.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.up_proj.weight": 
"model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.214.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.215.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.216.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", + 
"model.layers.58.mlp.experts.217.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", + "model.layers.58.mlp.experts.218.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.219.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.220.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.gate_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.221.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.222.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.223.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.down_proj.weight": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.224.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.225.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.226.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.227.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.58.mlp.experts.228.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.228.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.229.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.230.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.up_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.231.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.232.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.233.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.234.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.gate_proj.weight": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.235.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.236.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.237.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.58.mlp.experts.238.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.238.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.239.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.240.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.241.down_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.242.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.243.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.244.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.up_proj.weight": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.245.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.246.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.247.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.58.mlp.experts.248.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.249.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.250.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.251.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.gate_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.252.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.253.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.254.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.down_proj.weight": 
"model-00155-of-000163.safetensors", + "model.layers.58.mlp.experts.255.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.q_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.kv_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.self_attn.o_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.shared_experts.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.0.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.1.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.2.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.3.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.3.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.4.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.5.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.6.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.7.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.8.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.9.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.10.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.10.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.11.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.12.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.13.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.14.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.15.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.16.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.17.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.17.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.18.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.19.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.20.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.21.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.22.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.23.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.24.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.24.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.25.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.26.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.27.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.28.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.29.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.30.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.31.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.31.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.32.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.33.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.34.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.35.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.36.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.37.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.38.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.38.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.39.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.40.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.41.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.42.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.43.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.44.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.45.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.45.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.46.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.47.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.48.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.49.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.50.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.51.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", + 
"model.layers.59.mlp.experts.52.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.52.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.53.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.54.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", + "model.layers.59.mlp.experts.55.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.55.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.56.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.57.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.58.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.59.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.59.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.60.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.61.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.62.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.63.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.64.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.65.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.66.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.66.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.67.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.68.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.69.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.70.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.71.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.72.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.73.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.73.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.74.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.75.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.76.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.77.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.78.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.79.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.80.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.80.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.81.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.82.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.83.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.84.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.85.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.86.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.87.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.87.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.88.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.89.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.90.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.91.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.92.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.93.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.94.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.94.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.95.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.96.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.97.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.98.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.99.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.100.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.101.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.101.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.102.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.103.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.up_proj.weight_scale_inv": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.104.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.105.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.106.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.107.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.108.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.109.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.110.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.111.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.111.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.112.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.113.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.114.down_proj.weight_scale_inv": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.115.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.116.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.117.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.118.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.119.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.120.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.121.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.122.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.123.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.124.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.gate_proj.weight_scale_inv": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.125.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.126.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.127.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.128.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.129.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.130.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.131.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.132.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.132.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.133.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.134.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.up_proj.weight_scale_inv": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.135.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.136.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.137.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.138.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.139.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.140.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.141.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.142.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.142.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.143.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.144.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.145.down_proj.weight_scale_inv": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.146.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.147.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.148.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight": 
"model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.149.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.150.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.151.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", + "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", + 
"model.layers.59.mlp.experts.152.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.153.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.154.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.155.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.gate_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.156.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.157.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.158.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.159.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.160.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.161.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.162.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.163.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.163.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.164.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.165.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.up_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.166.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.167.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.168.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.169.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.gate_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.170.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.171.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.172.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.173.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.173.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.174.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.175.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.176.down_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.177.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.178.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.179.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.up_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.180.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.181.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.182.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.183.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.184.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.185.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.186.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.gate_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.187.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.188.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.189.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.down_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.190.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.191.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.192.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.193.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.194.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.194.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.195.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.196.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.up_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.197.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.198.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.199.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.200.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.gate_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.201.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.202.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.203.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.204.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.204.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.205.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.206.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.207.down_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.208.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.209.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.210.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.up_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.211.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.212.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.213.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.214.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.215.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.216.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.217.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.gate_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.218.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.219.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.220.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.down_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.221.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.222.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.223.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.224.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.225.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.225.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.226.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.227.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.up_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.228.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.229.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.230.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.231.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.gate_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.232.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.233.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.234.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.235.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.235.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.236.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.237.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.238.down_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.239.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.240.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.241.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.up_proj.weight": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.242.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.243.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.244.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", + 
"model.layers.59.mlp.experts.245.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.246.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.247.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.248.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.gate_proj.weight_scale_inv": 
"model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.249.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", + "model.layers.59.mlp.experts.250.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.250.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.251.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.down_proj.weight": 
"model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.252.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.253.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.254.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.59.mlp.experts.255.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.59.post_attention_layernorm.weight": 
"model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.q_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.kv_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.self_attn.o_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.shared_experts.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.0.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.0.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.1.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.2.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.3.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.4.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.5.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.6.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.7.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.7.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.8.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.9.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.10.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.11.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.12.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.13.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.14.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.14.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.15.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.16.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.17.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.18.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.19.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.20.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.21.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.21.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.22.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.23.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.24.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.25.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.26.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.27.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.28.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.28.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.29.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.30.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.31.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.32.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.33.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.34.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.35.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.35.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.36.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.37.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.38.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.39.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.40.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.41.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.42.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.42.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.43.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.44.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.45.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.46.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.47.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.48.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.49.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.49.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.50.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.51.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.52.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.53.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.54.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.55.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.56.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.56.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.57.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.58.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.59.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.60.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.61.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.62.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.63.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.63.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.64.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.65.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.66.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.67.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.68.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.69.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.70.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.70.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.71.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.72.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.73.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.74.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.75.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.76.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.77.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.77.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.78.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.79.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.80.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.81.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.82.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.83.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", + 
"model.layers.60.mlp.experts.84.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.84.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.85.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", + "model.layers.60.mlp.experts.86.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.87.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.88.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.89.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.90.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.91.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.91.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.92.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.93.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.94.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.95.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.96.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.97.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.98.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.98.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.99.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.100.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.101.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.102.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.103.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.104.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.105.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.105.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.106.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.107.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.up_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.108.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.109.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.110.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.111.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.112.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.113.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.114.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.115.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.115.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.116.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.117.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.118.down_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.119.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.120.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.121.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.122.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.123.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.124.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.125.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.126.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.127.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.128.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.gate_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.129.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.130.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.131.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.132.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.133.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.134.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.135.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.136.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.136.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.137.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.138.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.up_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.139.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.140.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.141.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.142.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.143.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.144.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.145.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.146.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.146.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.147.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.148.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.149.down_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.150.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.151.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.152.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.153.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.154.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.155.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.156.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.157.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.158.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.159.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.gate_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.160.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.161.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.162.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.down_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.163.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.164.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.165.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.166.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.167.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.167.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.168.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.169.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.up_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.170.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.171.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.172.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.173.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.gate_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.174.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.175.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.176.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", + 
"model.layers.60.mlp.experts.177.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.177.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.178.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.179.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.180.down_proj.weight_scale_inv": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.181.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.182.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.183.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.up_proj.weight": 
"model-00159-of-000163.safetensors", + "model.layers.60.mlp.experts.184.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.184.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.185.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.186.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.187.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.188.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.189.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.190.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.gate_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.191.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.192.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.193.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.down_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.194.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.195.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.196.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.197.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.198.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.198.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.199.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.200.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.up_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.201.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.202.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.203.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.204.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.gate_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.205.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.206.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.207.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.208.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.208.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.209.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.210.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.211.down_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.212.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.213.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.214.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.up_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.215.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.216.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.217.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.218.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.219.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.220.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.221.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.gate_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.222.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.223.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.224.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.down_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.225.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.226.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.227.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.228.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.229.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.229.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.230.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.231.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.up_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.232.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.233.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.234.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.235.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.gate_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.236.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.237.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.238.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.239.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.239.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.240.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.241.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.242.down_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.243.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.244.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.245.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.up_proj.weight": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.246.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.247.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.248.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", + 
"model.layers.60.mlp.experts.249.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.250.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.251.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.252.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.gate_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.253.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.254.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.60.mlp.experts.255.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", + "model.norm.weight": "model-00160-of-000163.safetensors", + "lm_head.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_proj.weight_scale_inv": 
"model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.q_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.kv_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.self_attn.o_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", + "model.layers.61.mlp.shared_experts.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.0.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.0.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.1.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.2.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.3.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.4.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.5.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.6.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.7.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.7.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.8.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.9.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.10.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.11.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.12.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.13.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.14.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.14.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.15.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.16.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.17.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.18.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.19.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.20.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.21.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.21.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.22.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.23.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.24.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.25.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.26.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.27.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.28.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.28.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.29.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.30.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.31.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.32.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.33.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.34.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.35.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.35.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.36.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.37.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.38.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.39.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.40.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.41.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.42.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.42.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.43.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.44.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.45.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.46.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.47.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.48.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.49.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.49.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.50.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.51.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.52.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.53.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.54.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.55.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.56.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.56.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.57.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.58.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.59.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.60.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.61.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.62.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.63.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.63.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.64.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.65.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.66.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.67.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.68.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.69.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.70.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.70.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.71.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.72.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.73.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.74.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.75.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.76.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.77.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.77.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.78.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.79.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.80.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.81.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.82.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.83.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.84.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.84.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.85.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.86.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.87.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.88.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.89.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.90.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.91.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.91.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.92.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.93.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.94.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + 
"model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.95.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.96.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", + "model.layers.61.mlp.experts.97.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.97.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.98.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.98.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.99.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.100.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.101.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.102.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.103.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.104.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.105.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.105.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.106.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.107.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.108.down_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.109.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.110.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.111.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.112.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.113.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.114.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.115.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.116.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.117.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.118.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.gate_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.119.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.120.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.121.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.122.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.123.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.124.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.125.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.126.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.126.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.127.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.128.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.up_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.129.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.130.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.131.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.132.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.133.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.134.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.135.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.136.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.136.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.137.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.138.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.139.down_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.140.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.141.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.142.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.143.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.144.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.145.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.146.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.147.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.148.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.149.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.gate_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.150.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.151.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.152.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.153.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.154.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.155.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.156.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.157.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.157.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.158.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.159.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.up_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.160.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.161.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.162.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.163.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.gate_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.164.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.165.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.166.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.167.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.167.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.168.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.169.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.170.down_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.171.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.172.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.173.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.up_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.174.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.175.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.176.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.177.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.178.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.179.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.180.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.gate_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.181.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.182.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.183.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.down_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.184.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.185.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.186.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.187.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", + 
"model.layers.61.mlp.experts.188.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.188.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.189.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.190.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.up_proj.weight_scale_inv": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.191.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.192.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.193.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.194.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.gate_proj.weight": 
"model-00162-of-000163.safetensors", + "model.layers.61.mlp.experts.195.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.195.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.196.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.197.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.198.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.198.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.199.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.200.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.201.down_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.202.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.203.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.204.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.up_proj.weight": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.205.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.206.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.207.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.208.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.209.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.210.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.211.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.gate_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.212.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.213.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.214.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.down_proj.weight": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.215.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.216.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.217.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.218.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.219.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.219.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.220.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.221.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.up_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.222.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.223.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.224.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.225.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.gate_proj.weight": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.226.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.227.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.228.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.229.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.229.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.230.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.231.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.232.down_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.233.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.234.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.235.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.up_proj.weight": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.236.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.237.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.238.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.239.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.240.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.241.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.242.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.gate_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.243.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.244.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.245.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.down_proj.weight": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.246.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.247.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.248.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.249.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", + 
"model.layers.61.mlp.experts.250.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.250.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.251.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.252.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.up_proj.weight_scale_inv": 
"model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.253.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.254.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.mlp.experts.255.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", + "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors", + "model.layers.61.enorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.hnorm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.eh_proj.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.norm.weight": "model-00163-of-000163.safetensors", + "model.layers.61.shared_head.head.weight": "model-00163-of-000163.safetensors" 
+ } +} \ No newline at end of file diff --git a/README.md b/README.md index 17ae1ac75ada0d94d3382ed604a7e18d91406567..7f315a1451f18848de55ca70a85d65b7f843e621 100644 --- a/README.md +++ b/README.md @@ -10,21 +10,201 @@ tags: - unsloth - transformers --- -
-

- deepseek-ai/DeepSeek-V3-0324 -

-
- - - - - - - - - -
+ +# DeepSeek-V3-0324 + + + + +
+ DeepSeek-V3 +
+
+
+ + Homepage + + + Chat + + + Hugging Face + +
+ +
+ + Discord + + + Wechat + + + Twitter Follow + +
+ +
+ + License +
-Thank you to the DeepSeek team for releasing their March update to the DeepSeek V3 models. \ No newline at end of file +## Features + +DeepSeek-V3-0324 demonstrates notable improvements over its predecessor, DeepSeek-V3, in several key aspects. + +![Model Performance](figures/0324_comparison.png) + +### Reasoning Capabilities + +- Significant improvements in benchmark performance: + - MMLU-Pro: 75.9 → 81.2 (+5.3) + - GPQA: 59.1 → 68.4 (+9.3) + - AIME: 39.6 → 59.4 (+19.8) + - LiveCodeBench: 39.2 → 49.2 (+10.0) + +### Front-End Web Development + +- Improved the executability of the code +- More aesthetically pleasing web pages and game front-ends + +### Chinese Writing Proficiency + +- Enhanced style and content quality: + - Aligned with the R1 writing style + - Better quality in medium-to-long-form writing + +- Feature Enhancements + - Improved multi-turn interactive rewriting + - Optimized translation quality and letter writing + +### Chinese Search Capabilities + +- Enhanced report analysis requests with more detailed outputs + +### Function Calling Improvements + +- Increased accuracy in Function Calling, fixing issues from previous V3 versions + +--- + +## Usage Recommendations + +### System Prompt + +In the official DeepSeek web/app, we use the same system prompt with a specific date. + +``` +该助手为DeepSeek Chat,由深度求索公司创造。 +今天是{current date}。 +``` + +For example, + +``` +该助手为DeepSeek Chat,由深度求索公司创造。 +今天是3月24日,星期一。 +``` + +### Temperature + +In our web and application environments, the temperature parameter $T_{model}$ is set to 0.3. Because many users use the default temperature 1.0 in API calls, we have implemented an API temperature $T_{api}$ mapping mechanism that adjusts the input API temperature value of 1.0 to the most suitable model temperature setting of 0.3. 
+ +$$ +T_{model} = T_{api} \times 0.3 \quad (0 \leq T_{api} \leq 1) +$$ + +$$ +T_{model} = T_{api} - 0.7 \quad (1 < T_{api} \leq 2) +$$ + +Thus, if you call V3 via API, an API temperature of 1.0 corresponds to a model temperature of 0.3. + +### Prompts for File Uploading and Web Search + +For file uploading, please follow the template to create prompts, where {file_name}, {file_content} and {question} are arguments. + +``` +file_template = \ +"""[file name]: {file_name} +[file content begin] +{file_content} +[file content end] +{question}""" +``` + +For Web Search, {search_results}, {cur_date}, and {question} are arguments. + +For Chinese queries, we use the prompt: + +``` +search_answer_zh_template = \ +'''# 以下内容是基于用户发送的消息的搜索结果: +{search_results} +在我给你的搜索结果中,每个结果都是[webpage X begin]...[webpage X end]格式的,X代表每篇文章的数字索引。请在适当的情况下在句子末尾引用上下文。请按照引用编号[citation:X]的格式在答案中对应部分引用上下文。如果一句话源自多个上下文,请列出所有相关的引用编号,例如[citation:3][citation:5],切记不要将引用集中在最后返回引用编号,而是在答案对应部分列出。 +在回答时,请注意以下几点: +- 今天是{cur_date}。 +- 并非搜索结果的所有内容都与用户的问题密切相关,你需要结合问题,对搜索结果进行甄别、筛选。 +- 对于列举类的问题(如列举所有航班信息),尽量将答案控制在10个要点以内,并告诉用户可以查看搜索来源、获得完整信息。优先提供信息完整、最相关的列举项;如非必要,不要主动告诉用户搜索结果未提供的内容。 +- 对于创作类的问题(如写论文),请务必在正文的段落中引用对应的参考编号,例如[citation:3][citation:5],不能只在文章末尾引用。你需要解读并概括用户的题目要求,选择合适的格式,充分利用搜索结果并抽取重要信息,生成符合用户要求、极具思想深度、富有创造力与专业性的答案。你的创作篇幅需要尽可能延长,对于每一个要点的论述要推测用户的意图,给出尽可能多角度的回答要点,且务必信息量大、论述详尽。 +- 如果回答很长,请尽量结构化、分段落总结。如果需要分点作答,尽量控制在5个点以内,并合并相关的内容。 +- 对于客观类的问答,如果问题的答案非常简短,可以适当补充一到两句相关信息,以丰富内容。 +- 你需要根据用户要求和回答内容选择合适、美观的回答格式,确保可读性强。 +- 你的回答应该综合多个相关网页来回答,不能重复引用一个网页。 +- 除非用户要求,否则你回答的语言需要和用户提问的语言保持一致。 + +# 用户消息为: +{question}''' +``` + +For English queries, we use the prompt: + +``` +search_answer_en_template = \ +'''# The following contents are the search results related to the user's message: +{search_results} +In the search results I provide to you, each result is formatted as [webpage X begin]...[webpage X end], where X represents the numerical index of each article. Please cite the context at the end of the relevant sentence when appropriate. 
Use the citation format [citation:X] in the corresponding part of your answer. If a sentence is derived from multiple contexts, list all relevant citation numbers, such as [citation:3][citation:5]. Be sure not to cluster all citations at the end; instead, include them in the corresponding parts of the answer. +When responding, please keep the following points in mind: +- Today is {cur_date}. +- Not all content in the search results is closely related to the user's question. You need to evaluate and filter the search results based on the question. +- For listing-type questions (e.g., listing all flight information), try to limit the answer to 10 key points and inform the user that they can refer to the search sources for complete information. Prioritize providing the most complete and relevant items in the list. Avoid mentioning content not provided in the search results unless necessary. +- For creative tasks (e.g., writing an essay), ensure that references are cited within the body of the text, such as [citation:3][citation:5], rather than only at the end of the text. You need to interpret and summarize the user's requirements, choose an appropriate format, fully utilize the search results, extract key information, and generate an answer that is insightful, creative, and professional. Extend the length of your response as much as possible, addressing each point in detail and from multiple perspectives, ensuring the content is rich and thorough. +- If the response is lengthy, structure it well and summarize it in paragraphs. If a point-by-point format is needed, try to limit it to 5 points and merge related content. +- For objective Q&A, if the answer is very brief, you may add one or two related sentences to enrich the content. +- Choose an appropriate and visually appealing format for your response based on the user's requirements and the content of the answer, ensuring strong readability. 
+- Your answer should synthesize information from multiple relevant webpages and avoid repeatedly citing the same webpage. +- Unless the user requests otherwise, your response should be in the same language as the user's question. + +# The user's message is: +{question}''' +``` + +## How to Run Locally + +The model structure of DeepSeek-V3-0324 is exactly the same as DeepSeek-V3. Please visit the [DeepSeek-V3](https://github.com/deepseek-ai/DeepSeek-V3) repo for more information about running this model locally. + +**This model supports features such as function calling, JSON output, and FIM completion. For instructions on how to construct prompts to use these features, please refer to the [DeepSeek-V2.5](https://huggingface.co/deepseek-ai/DeepSeek-V2.5#function-calling) repo.** + +**NOTE: Direct use with Hugging Face Transformers is not supported yet.** + +## License + +This repository and the model weights are licensed under the [MIT License](LICENSE). + +## Citation + +``` +@misc{deepseekai2024deepseekv3technicalreport, + title={DeepSeek-V3 Technical Report}, + author={DeepSeek-AI}, + year={2024}, + eprint={2412.19437}, + archivePrefix={arXiv}, + primaryClass={cs.CL}, + url={https://arxiv.org/abs/2412.19437}, +} +``` + +## Contact +If you have any questions, please raise an issue or contact us at [service@deepseek.com](mailto:service@deepseek.com). 
diff --git a/model-00002-of-000163.safetensors b/model-00002-of-000163.safetensors index 9dfc29c0ae65b9ee990fed9d7642fb17c8e9b711..3acbb57eabe8cd668dea59d310b7abf8a50b9372 100644 --- a/model-00002-of-000163.safetensors +++ b/model-00002-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:400b76ca459923cc0c710ca51e05c8aa6167f595af208c15107800394a66a504 -size 4302383966 +oid sha256:5844015b9f68e501e8538508d1b31c5afe689179b325338a7674fbd5e379d40a +size 8602553952 diff --git a/model-00003-of-000163.safetensors b/model-00003-of-000163.safetensors index 7fc7f738a63ff3423eb7455a9eb77f8bdd676632..53f2d2c043a8da80af96c142b95cf8697a1e5bc1 100644 --- a/model-00003-of-000163.safetensors +++ b/model-00003-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1e0192d491a2cad015aed550f8c072c69dbea143e9f55074b4f5b513c0633026 -size 4302384375 +oid sha256:53d4aa08b71670df1fe00c8899400d1aee1cc94093b6828f22819b6f67ab866a +size 8602554152 diff --git a/model-00005-of-000163.safetensors b/model-00005-of-000163.safetensors index 17dc251016f414f67871393988701550a9e07d44..00d80a12289768816ed38d05bc94b26471f53294 100644 --- a/model-00005-of-000163.safetensors +++ b/model-00005-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1973c53f492006ff0eb70d677ebfa42bc40d2cafc1e15e64eb600765bfe7b7c1 -size 4302384154 +oid sha256:9eb020c759e3bde40e4f954df8c1cf486cd7b83f05f30ba1b83d06ae7c7d03e0 +size 8602554048 diff --git a/model-00006-of-000163.safetensors b/model-00006-of-000163.safetensors index 3efcac392549d551145f83d316c03e8b42a9cae3..c24437380426b0eb56133d4eec437c7b3d9a6ed8 100644 --- a/model-00006-of-000163.safetensors +++ b/model-00006-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2250eb7be1d22707f2effe99562de640b55980c2913e0640fa24d571cdfed642 -size 4372073602 +oid 
sha256:bbc4c8652b9d2d65cf6a49ca20854abf95c4f735bd4a11a7bdd0de90dd336483 +size 8741916520 diff --git a/model-00007-of-000163.safetensors b/model-00007-of-000163.safetensors index e14978808ed88cfe95df4c0fb9fdfac630490074..269ea8bf81c9f7dbd82f6cd549046b2bedd5ad98 100644 --- a/model-00007-of-000163.safetensors +++ b/model-00007-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8632d0847cd3082d9b66edefcc72d80c717b3fe4535b3d68b808da3c8806bceb -size 4306080097 +oid sha256:3082978bbf5223818fa50fab0038a60f40809624b14b6d64de446523ecb403cb +size 8606225096 diff --git a/model-00008-of-000163.safetensors b/model-00008-of-000163.safetensors index 599012f2194c7e1c6a3af36fe5cabad24f3b22bb..f356c6772da854f5d19dbcacd31c7363b121c55f 100644 --- a/model-00008-of-000163.safetensors +++ b/model-00008-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:85daa7fd14a621a084a16c2669a8b95bad9173353fa9ec2f0fd6be6726866a32 -size 4302384356 +oid sha256:313c9b7cb3e366ed3d7b691ec89ecf1ad36431b24ed1820a8ff5e90e4043b5eb +size 8602554144 diff --git a/model-00010-of-000163.safetensors b/model-00010-of-000163.safetensors index 7995c64f59869cb432dcc0f5b7ff2888f42b5c09..840c331d521ff2ea1b8723a5318f5e871525da3a 100644 --- a/model-00010-of-000163.safetensors +++ b/model-00010-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0317ba8c85441b4f3d0134d2d43a1535e073250ba223283ceffc46bdef5dd77b -size 4302383960 +oid sha256:78d0922e547a2ead061adf26afa98b9be8bd57d831be435e91a5985ac749d34a +size 8602553952 diff --git a/model-00011-of-000163.safetensors b/model-00011-of-000163.safetensors index 02ebf54fdc28f8e232d260fff9f50fd88290fee1..8326ca62ee0d2653023c0e31406ab2ffcf484870 100644 --- a/model-00011-of-000163.safetensors +++ b/model-00011-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid 
sha256:c5291900ff83cdf2786565e133d6b792313526df8e5cc17c120e0386426e66d7 -size 4302384375 +oid sha256:c6004755ecb9a6cc8b6c8956810fc4801b191df495cfd04f77af833fee85ca40 +size 8602554152 diff --git a/model-00012-of-000163.safetensors b/model-00012-of-000163.safetensors index b43976d0b4ecc66204435e6412f9b50946e388e5..d80e928c190383bfe53ddf3c5cfad6301994aca5 100644 --- a/model-00012-of-000163.safetensors +++ b/model-00012-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1596e384e28712a7da32481b414ad2f9d5205b7d914066aaa77861f52218e3e3 -size 1321583941 +oid sha256:914ef69f24bd9685a5af1705d7984cd0ac3155fd61b5f8a5f5bd2d6822a5311e +size 2642451624 diff --git a/model-00013-of-000163.safetensors b/model-00013-of-000163.safetensors index 51f994cc2d289b20295747152767a0dad226be46..9d4c3cabac70584bb7fc6a1ffd396b59a5131c84 100644 --- a/model-00013-of-000163.safetensors +++ b/model-00013-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0b5b8ac70defdc5393f02525d88ba2eb145f51ce9b2a11637de11b522d7c0da1 -size 4302317244 +oid sha256:0e550e63d81c1de11cea268eb8721d3ddf87059ea4f322e826ccd07a0090df06 +size 8598757320 diff --git a/model-00014-of-000163.safetensors b/model-00014-of-000163.safetensors index 0d47b1d1bacbca88687d914d22f3966935b8058e..95b358b4d3625fd846b2a271e731cba1b9eeff57 100644 --- a/model-00014-of-000163.safetensors +++ b/model-00014-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df727377a86d6bc8b3ae4ac3f4fb0937c5476fb8b19edd28c0924d016e7199f4 -size 4302384328 +oid sha256:76582352e6517885d22e1ef70160a6eab8fb21ce66737c8c482331f8af0c4602 +size 8602554136 diff --git a/model-00015-of-000163.safetensors b/model-00015-of-000163.safetensors index 2045f55aace35a3df0d97bb66c7572a7d47fddbf..5e8f90687f7c7102a69d49513b3fa23f18c21439 100644 --- a/model-00015-of-000163.safetensors +++ b/model-00015-of-000163.safetensors @@ -1,3 +1,3 @@ version 
https://git-lfs.github.com/spec/v1 -oid sha256:ae96924ba8d4f9e56221316ac185b1b5655ad08fd6abb425288d70f8e867d3a2 -size 4302350218 +oid sha256:cf9c3a62fe407632067c2e4d82a4b193684b8ddd05c3214920e82a700a2ff185 +size 8598786408 diff --git a/model-00016-of-000163.safetensors b/model-00016-of-000163.safetensors index 0e4998444bd7e5529de6d1a86cffa8d0ebc7f20c..4a7e1664d48aa7a7bb568e7af52f7ea30b6eb1ae 100644 --- a/model-00016-of-000163.safetensors +++ b/model-00016-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:506313cbaf4ed810cf5d104229fdbc4e19cde2b12cea9e55e9550131b171409e -size 4302383932 +oid sha256:0f67a95e5ecab2fb3426a3cffcd67130f49a02123422aefc544812df5a234982 +size 8602553936 diff --git a/model-00017-of-000163.safetensors b/model-00017-of-000163.safetensors index e1e1086cda4adb005035415cb6c2b83a7bed42c5..54060071abac849b72fce24b2971d36864b634df 100644 --- a/model-00017-of-000163.safetensors +++ b/model-00017-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d396bde693edd1001be8440865e2c61b121d0cad562596e19ca01bf29dabcca4 -size 4302384377 +oid sha256:c1ad930269c70257aac8721b09e6a872b2c6c7acacc2fc03cd142cdf3a8df7af +size 8602554152 diff --git a/model-00018-of-000163.safetensors b/model-00018-of-000163.safetensors index 412f004e0f98503979da805147b02fe442bc46ef..e88b46379b50fa91e91756b6613e2520446e0049 100644 --- a/model-00018-of-000163.safetensors +++ b/model-00018-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4ebc50b2e0e220583a2597770d94f1a6c3e87be325470d0f4a15984bab424354 -size 4302350026 +oid sha256:478ef71639bacf1cf2ed23acfb98df6f9689589dfb0b795bbc6282a9f7e54253 +size 8598786312 diff --git a/model-00019-of-000163.safetensors b/model-00019-of-000163.safetensors index 53aff9795404ea7b325f9ae4cdeb26f6188dbb1c..8635337b9c3fa46031dfdec16d4e7d73028b6aa1 100644 --- a/model-00019-of-000163.safetensors +++ b/model-00019-of-000163.safetensors 
@@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0a9d59229d198ee0b4966834d17d61811e8afe998e7634c87e643f51bc866d75 -size 4302384124 +oid sha256:eb1005b99407ca2b72ad988f6125cbb8d2f13b1e09818ee6a82140847082f422 +size 8602554032 diff --git a/model-00021-of-000163.safetensors b/model-00021-of-000163.safetensors index 86bbfb479bb4c18e28db7c116e1635f86470d551..eec6eb942ad80bb8c9e6573811151b13b8a1ddbf 100644 --- a/model-00021-of-000163.safetensors +++ b/model-00021-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8afd4121eeb804b11838f51f4b49598d0e66bafe40d70a2def88698901a595d6 -size 4302350413 +oid sha256:c218916efad7c04510b980e6bd7e3547e072cbff542dc8dea5bd22eecd448d91 +size 8598786512 diff --git a/model-00022-of-000163.safetensors b/model-00022-of-000163.safetensors index 2f5d3a30f670089153eb3d5cfbc557ef504ab979..a5f15dadf4e6841ab41e06d61488b25e1084de97 100644 --- a/model-00022-of-000163.safetensors +++ b/model-00022-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d6e5d4ea01bc15edb85b06f7d0ea9a41acf2efe18dd7c6bf1d85ddf2c4074fc0 -size 4302384900 +oid sha256:1e61b9c4bf542fbd3c739f70ff66c40848e7718736b224118563df7c4016280b +size 8602554416 diff --git a/model-00023-of-000163.safetensors b/model-00023-of-000163.safetensors index fb9c7747d4eb9f0a388b054c756d2a8bb132ecf7..f3e7566249cea6056a7ab119ba6f39ab341ee7c8 100644 --- a/model-00023-of-000163.safetensors +++ b/model-00023-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9406624825565d25194fdf9462b397b5acba0bcab3bf1bdf9601952280945269 -size 4302350808 +oid sha256:a76594d91b144550a1fdbb44b87815324bc006a08443e9e8119b98db0d24b85f +size 8598786704 diff --git a/model-00024-of-000163.safetensors b/model-00024-of-000163.safetensors index 30c773f5514a0cc50e0ce6fe3f4aa6711f0c0d8c..0a4dba927b64eeb4404d32027f083ff58fb810b1 100644 --- a/model-00024-of-000163.safetensors +++ 
b/model-00024-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:488969a9e8a378b243594f86144827dfb4c8549b3c6d719e21572a2306e742b4 -size 4302384504 +oid sha256:54efcb48e240c37fbf4ad61608c36145297474ebe81c7cf58f7da37d6f0b0cc9 +size 8602554224 diff --git a/model-00025-of-000163.safetensors b/model-00025-of-000163.safetensors index c8badf84570fc3b80d1748cecfffede8d0d601b2..9652edcb61451d60a47a6dc14b64fc6495727845 100644 --- a/model-00025-of-000163.safetensors +++ b/model-00025-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:450cc3f29910ee8d38ac5a5ec39901f83f63920bbc4d15175e5f5e58119dff29 -size 4302384961 +oid sha256:760df9cb8100d1014e4a6c286a7289af633793441dffa0e46bb138c8afcac88c +size 8602554448 diff --git a/model-00026-of-000163.safetensors b/model-00026-of-000163.safetensors index 65773bb139a2bdd913095abc9bedfc2d6d372d6a..01df38017d75569538fa42d8abc71dcd67758b82 100644 --- a/model-00026-of-000163.safetensors +++ b/model-00026-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bdfe115c31c700af118ca1f2f3cfb121c1d60e40404a688d63b686e8b54eacb7 -size 4302350620 +oid sha256:b1586bb9250ddaca3db7e5444dbdc7cbe5b06460d4d96dc88fc4bd7d27c61b0f +size 8598786616 diff --git a/model-00027-of-000163.safetensors b/model-00027-of-000163.safetensors index 5483b33d4f6af0bb84801bd535aeb5ca31f00f75..00604163ceba2c8eedcc56f7a7bf664492a95213 100644 --- a/model-00027-of-000163.safetensors +++ b/model-00027-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:13e981a9bdc7527d1d496ebe47456c7edd81d843c8125597d5ee640f18d65413 -size 4302384692 +oid sha256:890493f4a165a9674a9eadd3ec564d42fd6f6d64856549332bd6991cb83a87cb +size 8602554312 diff --git a/model-00028-of-000163.safetensors b/model-00028-of-000163.safetensors index e5eb594ccf40e5992f9c9edaf699ad86e898711c..b8af23a5b628d86c9a454de38d25ca6641eceb81 100644 --- 
a/model-00028-of-000163.safetensors +++ b/model-00028-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d767507070d19fa2736474f701a58317a9584e32df6d9bd010611f939c86049d -size 4302384963 +oid sha256:0e606831e47403d9ff9725d126281e0c326f9d7b6eca273a98640ba1b35c9655 +size 8602554448 diff --git a/model-00029-of-000163.safetensors b/model-00029-of-000163.safetensors index 2ecc5b8b58238c8fd8022e51fc9037b50097aed3..be92b2cb9d4c064d9918f39cb545c4c7cbd69173 100644 --- a/model-00029-of-000163.safetensors +++ b/model-00029-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:11b1ef947996f5426c462156be33547dbf1b08d8a12eca063d27889553e77470 -size 4302350448 +oid sha256:32ba974c0a902b5914a9dfdf386ec70431195c771398f03682148793eb970e4b +size 8598786520 diff --git a/model-00030-of-000163.safetensors b/model-00030-of-000163.safetensors index 72f3bfc48ddcee24cb5543aa5d56932fc52e3182..b728e143fe106a3cf88938b71c76403638527463 100644 --- a/model-00030-of-000163.safetensors +++ b/model-00030-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ff7740ee8707ad1e058634afd4d8c525cc2dbd13d81be8bd3ebbe2d999b9461 -size 4302384884 +oid sha256:312eecba0c4fea75fca165e87b52601ec8635093416663aa1b24ece565398fbd +size 8602554408 diff --git a/model-00031-of-000163.safetensors b/model-00031-of-000163.safetensors index dca450dcb9592684dc9e5c84e3a9ae3b3cb20a25..1cb9a6e4823e1fa6220b7c94583b9bf4de975966 100644 --- a/model-00031-of-000163.safetensors +++ b/model-00031-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:07afa8b68a432adc61b74f5649265bb656efae1ffcd6da6f23549f6b53a2093a -size 4302350824 +oid sha256:02e585cab72857aea7829481367491d72201ea7e4c02344d4f1bf3add8dfb3c2 +size 8598786720 diff --git a/model-00032-of-000163.safetensors b/model-00032-of-000163.safetensors index 
2582ceb58f4aeda00b04431268394e401f5a4ec0..e69a2f90a69b408b361cb06ef41fa5d31288eff9 100644 --- a/model-00032-of-000163.safetensors +++ b/model-00032-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:361f93b0bcbf04a2d5c99f2265d74c16d2ac6606fea1322633be0d4c578f93ac -size 4302384488 +oid sha256:e96b70c17e382f81e821a34afd358b495c80da1c3e5efe69ecc8825e0cadf686 +size 8602554208 diff --git a/model-00033-of-000163.safetensors b/model-00033-of-000163.safetensors index f8867787af4edbb7eb3631f2369bbe79e1203008..14f66d9710368d87dd3f74b95b19cd9bf6f601df 100644 --- a/model-00033-of-000163.safetensors +++ b/model-00033-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d5cd3a3bd61d43a159b186554e0d652d90ef80355a4d64cdfab2f09c59586ea1 -size 4302384963 +oid sha256:5135fe94706cc80b41920288bbde014ff0bc122fbea251a0e8a04351a2da76c9 +size 8602554448 diff --git a/model-00034-of-000163.safetensors b/model-00034-of-000163.safetensors index 61de97cf113b61a53b34288812bf5a87d8eb9873..a72ee25c0a9280eae5c01a55a3892e6c82b6a94d 100644 --- a/model-00034-of-000163.safetensors +++ b/model-00034-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:df4c5f0efee23e96b0420e25a63e266acffba55a72c4dbb23efcaecaee279461 -size 1747417474 +oid sha256:fde2b4cdacc09e9c9af1eda18a1d6995485d9f0c82b687acdbbb37b06bde3e66 +size 3493899088 diff --git a/model-00035-of-000163.safetensors b/model-00035-of-000163.safetensors index a9511a556be58e5c5823198547299fc0de10c386..ec589f22b0ba48eccb19dd92802d079f0ec6bb02 100644 --- a/model-00035-of-000163.safetensors +++ b/model-00035-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:59907496ec35f620146f7e2a771acbae6315b73beb7c9b4484791a5769e92720 -size 4302317817 +oid sha256:141a16e40b4dac1c5db98e497302c6ab61154946109e27905e18380ae5e4815e +size 8598757608 diff --git a/model-00036-of-000163.safetensors 
b/model-00036-of-000163.safetensors index 7b212baabdd7c5e15f4a950d32ffbf41517e1f92..d7fa9654c08dceb5a9ba0b2320666409e9bfdfec 100644 --- a/model-00036-of-000163.safetensors +++ b/model-00036-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:816a8da951743290c6cc77ee584023fd9063447256abef3937e9d73aed442e40 -size 4302384914 +oid sha256:a47d1a6d602b74c372f48ec0145ae54d5fd422eb51707a65499b70a701f13e8f +size 8602554424 diff --git a/model-00037-of-000163.safetensors b/model-00037-of-000163.safetensors index 63e312b1e079f5aac6fade7537417eea1421fb92..353fc62535e75598077d1f75e2dd4bd129cf6363 100644 --- a/model-00037-of-000163.safetensors +++ b/model-00037-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:03da5c0e525f134c3fb902409a9e737608c38a30710ed489a8e6627b511a25e1 -size 4302350794 +oid sha256:d42e863f615f63606661c72ed90872b04fec2e63015ae6fc6edb16b89bf70f7a +size 8598786704 diff --git a/model-00038-of-000163.safetensors b/model-00038-of-000163.safetensors index f0f0d50d73753c71c6a11f21d8bc75aab6dd1fd4..9ec4b77fec326d53fc27feb1b2cfd53d89288cdb 100644 --- a/model-00038-of-000163.safetensors +++ b/model-00038-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c0e6e082c73bdba9c830cfe08ec9f6424cd83296cae517dfab2338270a848334 -size 4302384518 +oid sha256:40e47b8be093ef3ad52a6792f0203f4a0777fae5812e1cb7774fa001580c4be2 +size 8602554224 diff --git a/model-00039-of-000163.safetensors b/model-00039-of-000163.safetensors index abb75739632a2edaed08db2e5347d0b2a0848eae..9d9cf39122e69f1f38e4fbf2da5eacba21e9bafb 100644 --- a/model-00039-of-000163.safetensors +++ b/model-00039-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a8dba03ca01e579f57e83906aed8aa9f4cd8205f6d32b9888dee455a64896b34 -size 4302384963 +oid sha256:bcd07543e83bde077a87a68c20217e11bf838b16050c04e55e157a2d4b7b178f +size 8602554448 diff --git 
a/model-00040-of-000163.safetensors b/model-00040-of-000163.safetensors index 048d684eecaeaec546504f74c47fb295469fe025..11a1a0dc8b5645e6a41121bef32a287d88c51028 100644 --- a/model-00040-of-000163.safetensors +++ b/model-00040-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2ebb24adff0b0955375de7ffa071a27381df5dfcef8273b634de47f43199b0e1 -size 4302350602 +oid sha256:36a021810ed2ff68c31b7dfe8c0591d17ac3b120de52656a2477bb3013ae11fc +size 8598786608 diff --git a/model-00042-of-000163.safetensors b/model-00042-of-000163.safetensors index c0603a07b0d8e931899b6117ebe6e2437d203473..fb8011fc2407e8d210919efae42d01d1f130a105 100644 --- a/model-00042-of-000163.safetensors +++ b/model-00042-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9666e834327b2fdc9cb3be9954eda58754c7415dd63ccce449ec1e5e492a5924 -size 4302384963 +oid sha256:baff888ffbb110a28310b2653dbcb73f1e8e0a0b8bcd699e03cbd6571acf49f2 +size 8602554448 diff --git a/model-00043-of-000163.safetensors b/model-00043-of-000163.safetensors index a050dee8617bd4db83f2d1edc63fe97014698aa7..5ecdf905c1437b3af05518d58a051666a89023b5 100644 --- a/model-00043-of-000163.safetensors +++ b/model-00043-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dda5691da3edae3b462c90722d82a345dbb5713ea7d0739c865b09aea593f601 -size 4302350432 +oid sha256:5efb3e13c7f348a4eb1a66e700b671e34a777fbff5da0ebb9ec89bbdfdf45fd5 +size 8598786504 diff --git a/model-00045-of-000163.safetensors b/model-00045-of-000163.safetensors index 6d68b258d64330bda8e9960b71a648d9ebc28c3e..0dab214b7de6d876a4c5bb969f6c4920cad55771 100644 --- a/model-00045-of-000163.safetensors +++ b/model-00045-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:929fa255d58727dae32f88ff5323cb45a9a898e864926341cecac859570114b8 -size 4302350808 +oid sha256:8578984e56ebde02f4e0c2c279f1951a56ef36e2f8beb44232419ef7246979eb 
+size 8598786704 diff --git a/model-00048-of-000163.safetensors b/model-00048-of-000163.safetensors index 0afb7dbb6ef5d96bda2903ebd1bc2e7e1d0bf844..f74991b461b71e623469efd02a5001a724c3c90d 100644 --- a/model-00048-of-000163.safetensors +++ b/model-00048-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b5dbbd1df4a075642f11f88308c5648e90bafbaf74bece18ae5b77f17f36d905 -size 4302350620 +oid sha256:729fe23e267bac8c1be152d3368dab05af679ce93ecc98081ca83d138409c241 +size 8598786616 diff --git a/model-00049-of-000163.safetensors b/model-00049-of-000163.safetensors index dde7c182f131dbe49ab80fdd713778f55f201c1d..8b72eb11c292230ae5e8e6e7bd847b54fc0dd012 100644 --- a/model-00049-of-000163.safetensors +++ b/model-00049-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:308925e3cd15b67b74e6a3422d3e4667f31fc27eaa8e8669eb439942ee62159d -size 4302384692 +oid sha256:2f60c3173509406d2984070e907c4d10d67665c1927b21cbe1faa641f67151b2 +size 8602554312 diff --git a/model-00051-of-000163.safetensors b/model-00051-of-000163.safetensors index 9b01cd3b774917650d6230f5dced4a077f65e729..3d881ec3683d0f8a2ea78ef390549b17c574428a 100644 --- a/model-00051-of-000163.safetensors +++ b/model-00051-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:68fa813be7c3644a99d38a6fcb8d928e32a9691d1af1b51cbd0ce0afff240aeb -size 4302350448 +oid sha256:c2fdaca8859da0ca440950f0ea17b6bbef9d93c59b6505c483f600d7a117a520 +size 8598786520 diff --git a/model-00052-of-000163.safetensors b/model-00052-of-000163.safetensors index 4b54ee68bc456d8f6d522421675ef37a961157a5..4c4f647edaa63a5bd50ab17d81fd18c9ca3d727b 100644 --- a/model-00052-of-000163.safetensors +++ b/model-00052-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:806f360b5b46495a4f767a4aa9e4a83fceb6cf61415e3b418b714a3dd1411c68 -size 4302384884 +oid 
sha256:2eee1a7c9dd2c64497cb9bea567908e16762aa6240dd1d16e487ac17d9896703 +size 8602554408 diff --git a/model-00053-of-000163.safetensors b/model-00053-of-000163.safetensors index 17f0eb483b335a2e034a51ccb4d28a5b34daf88f..1c49d18a8d460df68d876f5aa2016835bfc17941 100644 --- a/model-00053-of-000163.safetensors +++ b/model-00053-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a8867bd41c3afe375ebcedf39a9e2b3793f69e4eeafdcdca8ca8ce9e2f810bd -size 4302350824 +oid sha256:9418b4bb065342dd16f6eb6489c7cfe2fe89a007cfed58ea3a33b7b034116867 +size 8598786720 diff --git a/model-00054-of-000163.safetensors b/model-00054-of-000163.safetensors index bc8dd2f09269409f7217be9c9e35e97da91d5537..19bfb5380be1d7f6ecc5237cd8a3447fed09301b 100644 --- a/model-00054-of-000163.safetensors +++ b/model-00054-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:274d3dd5e855ea3d06f29092c836c7bc628e22ba99fb6ee05520fb2da4b581e1 -size 4302384488 +oid sha256:544f8d00728d025f9ca5425e960acca957ce8b6da62a6b39efc661384566296a +size 8602554208 diff --git a/model-00055-of-000163.safetensors b/model-00055-of-000163.safetensors index 16dc9d8a192bd2530bc27061f2b7cd3f587e508f..93d1be02eb5b2dcf77e2a3b403c033bedda3509f 100644 --- a/model-00055-of-000163.safetensors +++ b/model-00055-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c4978652ad095ae7cfc494932da7b1dd6c8ab14c88c4b847b4ec609f74cec1e7 -size 4302384963 +oid sha256:ef3a17f0b506e08ecd5cda0962c827a46601fab0b62e5b188d8d29b3c73044d6 +size 8602554448 diff --git a/model-00056-of-000163.safetensors b/model-00056-of-000163.safetensors index 539153eedfb9fce829558189452b95ee185b2b97..70658bdb4f9c12145dd2089added1ef52976fbd4 100644 --- a/model-00056-of-000163.safetensors +++ b/model-00056-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid 
sha256:68130d2006590861b30611b7f6d177394136fb8b3cff7d3141bebf28e411227b -size 1747417474 +oid sha256:2fba1235ba7337b35af781580be81baa5c450ed27e6c0ec82820ab366f47aa77 +size 3493899088 diff --git a/model-00057-of-000163.safetensors b/model-00057-of-000163.safetensors index cd8c412a72d75dd532a38339fa5c24285c8f6b74..ef8cc316c5604f876c11cd3828f2463f4ec13435 100644 --- a/model-00057-of-000163.safetensors +++ b/model-00057-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3b4826e9817a96f45f0a5af284c94791549ab681f81f2ba5db521ab15a25938e -size 4302317817 +oid sha256:ca67e8930a61280b8ecd85007931df0adb3c94b6ac5ac2d66060708eaa390d04 +size 8598757608 diff --git a/model-00058-of-000163.safetensors b/model-00058-of-000163.safetensors index 248056009dc053c95eb0b5990b5919dab894cb99..30a7ff9e35309c4018bec8c1dd2b26cc20cc0a6d 100644 --- a/model-00058-of-000163.safetensors +++ b/model-00058-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:80630144922c076d9f0a53b6cdd95d31a3578b90a05f856623afb9f57bcf13aa -size 4302384914 +oid sha256:00f81559432273d6a37df25b2b2f650ff6427a731cf4cb684aa16ab6fa307495 +size 8602554424 diff --git a/model-00059-of-000163.safetensors b/model-00059-of-000163.safetensors index 46ea79000ff8211c4e021738c8e98283f564dfde..c308917794b34b475eeae978ea746c5854b4319e 100644 --- a/model-00059-of-000163.safetensors +++ b/model-00059-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:432a6a2fbb10a36c309924e5129d2b95691939c2d97c5f370d482dfe10f3f7d1 -size 4302350794 +oid sha256:43d9e9e9d7ab44a14fe996210ce4ba1645c7032bebcf50a9bf8c3579832b5ff7 +size 8598786704 diff --git a/model-00060-of-000163.safetensors b/model-00060-of-000163.safetensors index fef7bd2d99bcfbc22f994707148cfbbcc929d803..53e77683a0e9e4256ee92c5f74ad175091f596be 100644 --- a/model-00060-of-000163.safetensors +++ b/model-00060-of-000163.safetensors @@ -1,3 +1,3 @@ version 
https://git-lfs.github.com/spec/v1 -oid sha256:59f81c7cef16c0474d9695c17bb70ad8cfd99f7213aa939964294d807922a2fb -size 4302384518 +oid sha256:2e29796d278ec84e6b92c785123377b79b591dc9686cbdd8c9527eb7685e2cdf +size 8602554224 diff --git a/model-00061-of-000163.safetensors b/model-00061-of-000163.safetensors index d5aaa7778de9c0097e03c39289e9069104c239a9..d733ce8c4fee6db5cbf58193f4983d77756ed1de 100644 --- a/model-00061-of-000163.safetensors +++ b/model-00061-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:69cde84d3893db464497ac2894ae6128f8c058fd02f74d1c23afd0a2a93e2adf -size 4302384963 +oid sha256:b4c653fdb25e876ca92a18d7ef765676c2995879fa4a8028097acf61cc4c86bf +size 8602554448 diff --git a/model-00063-of-000163.safetensors b/model-00063-of-000163.safetensors index 725c402dbdf106069b491ffa478375ed51973a8a..f702b4aca67d69192b5b1507aa4ff8174fa6d45a 100644 --- a/model-00063-of-000163.safetensors +++ b/model-00063-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bf0f5c6e778fd299fdca261d1d2df72cbb93f1465c0de22cea2e6bbfc52554b6 -size 4302384710 +oid sha256:6bbaa706b11dd27c63ae40a4cf8e76c43f6e380d5108732873104baf427e4313 +size 8602554320 diff --git a/model-00064-of-000163.safetensors b/model-00064-of-000163.safetensors index 89bbb9b40334ff1efe86fffe3bfc45c7eeaa27b2..59210f507909640b1fc77d4c8f34bd4f4461c521 100644 --- a/model-00064-of-000163.safetensors +++ b/model-00064-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d99efa8b327f7fc4929798dfa3bafd04fb5c036915919a84e268aaf25e67424d -size 4302384963 +oid sha256:d365ca541720187c6e1b11569d39d9f9ab4eb110ed8708ef4d23f8df0e82f6ce +size 8602554448 diff --git a/model-00065-of-000163.safetensors b/model-00065-of-000163.safetensors index 07a3cfc32d9c71a5a6e7768e3449ea800d589c75..28bd8470cbc702fe0bc8d49ea9cf19228801d313 100644 --- a/model-00065-of-000163.safetensors +++ b/model-00065-of-000163.safetensors 
@@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:898c045b5e0602e2a496debcec20396a824310b3107f1c4db6214ed6a3c1ac79 -size 4302350432 +oid sha256:afc640828ab09a86ee4fe1a27a029a2b43dbacea5466fb207879a5c111e1cfe6 +size 8598786504 diff --git a/model-00067-of-000163.safetensors b/model-00067-of-000163.safetensors index 1e4468bfcd27ebba9351bd4e1d9ee33a92e3645c..d7d55814c602f6b9192583bd0b3aafbfe7e09eea 100644 --- a/model-00067-of-000163.safetensors +++ b/model-00067-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f0cbc915d403f7ae15744735b33e1ec65b53c7ebc2c2ee487481bd4fb6d111b2 -size 4302350808 +oid sha256:b312720a67ea077994ab54f513f3803d5d2c6fe835018cb31c78048f4f375090 +size 8598786704 diff --git a/model-00068-of-000163.safetensors b/model-00068-of-000163.safetensors index 526f046b3e1bfcea7c16d9a0b4c3d60e451dfe12..10353f681552b02f76de67bd86af6632aee55459 100644 --- a/model-00068-of-000163.safetensors +++ b/model-00068-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2594adae97d7a675fc785745101a1d66f007b43894fddd80440ced78eaf77e98 -size 4302384504 +oid sha256:71b6fd74acea607aed6ded74baf41e6da2f68b5f83031b7e74405406d4d0d3b4 +size 8602554224 diff --git a/model-00069-of-000163.safetensors b/model-00069-of-000163.safetensors index b21c6f9fa4e63af46280feb9e4dfc0b096c8efb3..0fdeb639e65ff07b4f5381dee583b3136a4c0caf 100644 --- a/model-00069-of-000163.safetensors +++ b/model-00069-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:01daa8eb84a97158ef325a1f34dbfbb29c093845b22e6dca560e4def807586df -size 4302384961 +oid sha256:49fafa7b8b37d2a3cca49ecea1da377db15576442e106141c4fc350471545cc9 +size 8602554448 diff --git a/model-00070-of-000163.safetensors b/model-00070-of-000163.safetensors index ee8e69dbf164bf2dbecdf26ba1440219b928d2bd..4aa29c0840467d591bedc41b8e327e6be585f527 100644 --- a/model-00070-of-000163.safetensors +++ 
b/model-00070-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1f0368ad214afaff4da8e61c2b84a237a91a369c3ad0d95daae38ca75b0d62b3 -size 4302350620 +oid sha256:5a29a8089d825c4e9e3b668140f4ebf7b64aa94841aba84028f3fec07602e957 +size 8598786616 diff --git a/model-00071-of-000163.safetensors b/model-00071-of-000163.safetensors index 98c9c4b48e78211425a9774826fe65f8405b1040..9ca3da55dbd22bbca957f30f51ba9e9556cb4798 100644 --- a/model-00071-of-000163.safetensors +++ b/model-00071-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0cc594400988bb846804388cd6c76496bf8ed0ccf975ebe85ba00a310532a59c -size 4302384692 +oid sha256:34695e3ca5626c4f1672ef6ee46416ed6fbea43c88c525c3913461dcb772eced +size 8602554312 diff --git a/model-00072-of-000163.safetensors b/model-00072-of-000163.safetensors index 7c748f207b51c83a662cb0190ba146f6aec38562..2fbf743501232b0b922d51d4879390c2e88b0e9d 100644 --- a/model-00072-of-000163.safetensors +++ b/model-00072-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6940c2e5c775b3d688aa8e6f25ffd22e40d089722c3085b5f1e0976ac23b4f9b -size 4302384963 +oid sha256:c5823d2f5137b3377511bf9cfa1402921afbe2a28fb4991fac3fb020d33663dd +size 8602554448 diff --git a/model-00073-of-000163.safetensors b/model-00073-of-000163.safetensors index 804dbeda9b27402c1747b9e0dbc2d66b41813744..868815711fb6f7e69fde97f38d08321561aa83f2 100644 --- a/model-00073-of-000163.safetensors +++ b/model-00073-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:3fc8ab4be0f4a284849e144c07173db39f5ed8d4e4d4838f2442f3d580d0356e -size 4302350448 +oid sha256:ca90078c16bba9970c99664dfddfdbf70b51d7992dca77ee3921b58b2d30e09d +size 8598786520 diff --git a/model-00074-of-000163.safetensors b/model-00074-of-000163.safetensors index c7ff1bfb8134ccc53c2e7e008ba335dbe114921a..8c03ea60885263d9d7e843397d57cb8b0d233156 100644 --- 
a/model-00074-of-000163.safetensors +++ b/model-00074-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9651fe2a556d41002612ecafb595fe97801e6cc2f22519ee9f64fbac9cfbc704 -size 4302384884 +oid sha256:7bb028a802296f054728c5de25f548428bbb043b26cc00140a3e99eec4655962 +size 8602554408 diff --git a/model-00075-of-000163.safetensors b/model-00075-of-000163.safetensors index 801babaca3b2f5cc41aed26aa397027935312f8d..38b38aa1b9c09b93dec19b61de4c9b10e9a5e4e8 100644 --- a/model-00075-of-000163.safetensors +++ b/model-00075-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f74e66e34acd6e3c61d1e90bbbac335c24e510720c33e44d3516803f38a518b0 -size 4302350824 +oid sha256:93778a5ccad8a1d56e659a9e40811351da9bc48563d4c112ccfa431ee9d5ac14 +size 8598786720 diff --git a/model-00076-of-000163.safetensors b/model-00076-of-000163.safetensors index 7318765531d96220ff7da4b6cfc951ae91ac3a26..b221fc15b13251a15b0801837c48f6d321368f3c 100644 --- a/model-00076-of-000163.safetensors +++ b/model-00076-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:986f6a11367f1b56006a8d332c16aac4e4b81ab29d0606b5e4cb4a00a01224e4 -size 4302384488 +oid sha256:426e6c32054da78a9a829fc88d3d6c67388ccd774eed360f99d042835911f5c4 +size 8602554208 diff --git a/model-00077-of-000163.safetensors b/model-00077-of-000163.safetensors index ef813402734e998ce8362df4fe92dd1bef79e85f..b5452de74665d8a4b0fd7737094d2d59556fc1e3 100644 --- a/model-00077-of-000163.safetensors +++ b/model-00077-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6b0e946a0d1d06087bb470f67208f1213c2a4ce47ca6fb56b7d31df9a27e2dc3 -size 4302384963 +oid sha256:efe737747edbdee62a1f2d4bec668094e4d037c0ecbdd4680ef19c67a0dc8444 +size 8602554448 diff --git a/model-00078-of-000163.safetensors b/model-00078-of-000163.safetensors index 
7fc7bc2ba57461e8182f74eb0af6c2cd8b544d40..c7c1de2f319f9b3ac0cb7f18fe70be3834ca9459 100644 --- a/model-00078-of-000163.safetensors +++ b/model-00078-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9835f6d79440750c5cc4b90b5f8c85a0dab9fca47cb549f9daa4afe5b0641d76 -size 1747417474 +oid sha256:c84a59f671f8ff2d401df72fb3af589f7ffcc57d6e5eb3bb58fa03cb0910c869 +size 3493899088 diff --git a/model-00079-of-000163.safetensors b/model-00079-of-000163.safetensors index ed54c4a161bbdbe8438645e300281312a799faf0..849c0596a2e3fb6c987f024a82b1a181d53085aa 100644 --- a/model-00079-of-000163.safetensors +++ b/model-00079-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8dfe2c6835455e683a9ef645217be5cc9e9a387027c1e89e443f5118a47a0303 -size 4302317817 +oid sha256:ed106d9523ae20496e9ea34decba0c8ebcb941d34daf2ab40d306b731ed19e73 +size 8598757608 diff --git a/model-00080-of-000163.safetensors b/model-00080-of-000163.safetensors index 8319df971cd47fb17b702c8852a91d28f75c86a3..d62f3fc368fa3364d65ad43609e049510702f76a 100644 --- a/model-00080-of-000163.safetensors +++ b/model-00080-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5afc8aa8b94c7291339887605bbe3943258aaed182885603b4027225d9894bd8 -size 4302384914 +oid sha256:e1a0bc5c3236d449286d2f943335dc5c174bbc6b10c8b2da12979bd106427ab2 +size 8602554424 diff --git a/model-00083-of-000163.safetensors b/model-00083-of-000163.safetensors index 9503cfb09c3cab46a5ed4e86439a28b11e0e2f73..e08ebc2c287541f2c47749b29d794d97eb5053bc 100644 --- a/model-00083-of-000163.safetensors +++ b/model-00083-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:095348fdecd55d4d4f1d16ca143bfdbdbaf68ca2da5d7cd401a2e23f44991ead -size 4302384963 +oid sha256:0c9a509083fd66cff7caa7dbafb25622e51b74b8617d048497c305cf79727d1e +size 8602554448 diff --git a/model-00084-of-000163.safetensors 
b/model-00084-of-000163.safetensors index 121b6e1878af19afbdaeef043fc47218df87fc8d..26d546a5ef25076534aad8ed4364d5c807ebcf18 100644 --- a/model-00084-of-000163.safetensors +++ b/model-00084-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ffcf0052d53fd36d1eb00b0377e297209d4f8497cd79a78c5d683e7ae6625465 -size 4302350602 +oid sha256:40b3bfe0944d0461fba80e05adeddbe80eac80fd5d692158637e18604535d32f +size 8598786608 diff --git a/model-00085-of-000163.safetensors b/model-00085-of-000163.safetensors index ec4e8766b82d93800843dc879653aba64dcc2667..bf61fc588a2a433730176e2956b1137d1e62c0d7 100644 --- a/model-00085-of-000163.safetensors +++ b/model-00085-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7b210ddf71720212cfc0a08360c97aeff96b33e29374f661eb740eb94f06cec8 -size 4302384710 +oid sha256:8fce3179ce0ff5c3647e31215fe8e0d4e8062cd6016b3d3201faff43f45881fa +size 8602554320 diff --git a/model-00087-of-000163.safetensors b/model-00087-of-000163.safetensors index fde7642e95e65f76fa1b15ffff750fe2f799bc61..f7b89be3faa181f2997e0c05cf00056bdf73db68 100644 --- a/model-00087-of-000163.safetensors +++ b/model-00087-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b89cf8ea275ad45b5e40fa215e4aaba099209bf9ba467f978c82f26b009c73cf -size 4302350432 +oid sha256:0a47be2bc55e4e42ecca6c0d9dffe201eeb9487460a1bdd43778eb4b54034e9f +size 8598786504 diff --git a/model-00088-of-000163.safetensors b/model-00088-of-000163.safetensors index 787d937cc9e76967ef66618162954ebe3d922846..10da81b6f1c2db61b0a2067929d760f27c79a8b6 100644 --- a/model-00088-of-000163.safetensors +++ b/model-00088-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7219a03969a16af8f722f5a7df6f5e2ad51e19c86fe34a2c841d2b9b0800d8f7 -size 4302384900 +oid sha256:d9fa51dea4930088b90e910e76097bc5c9e34ca00f826082107d1ad395a1825d +size 8602554416 diff --git 
a/model-00089-of-000163.safetensors b/model-00089-of-000163.safetensors index 14f8c146e66561109a5c1ce771a3c1ccb0ea37db..39c8a27048b2dc247606d2dc47038b69b51d29e2 100644 --- a/model-00089-of-000163.safetensors +++ b/model-00089-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e57eef5e6eb8fe1616dc3414321c75b8e4e9147579a1ff0467c8fbba592f27aa -size 4302350808 +oid sha256:438fb205fe973b4db853c56e48762fd929c151474757f4627d8c6e71e23f9ca1 +size 8598786704 diff --git a/model-00091-of-000163.safetensors b/model-00091-of-000163.safetensors index 61f087157f5d5b729cec9b953258c55d57cb9ad1..95b198c13dbcdffc6420c456f053dd1d4d14c4f1 100644 --- a/model-00091-of-000163.safetensors +++ b/model-00091-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2c5d3f066131af8c6e4e225f7bcdbb17d72f7e798492dff43ac0e73ea53363e -size 4302384961 +oid sha256:4b57478777931d0f588ea7b201122b5f18c1c9b81417ab4bd1ed2d20502360c3 +size 8602554448 diff --git a/model-00092-of-000163.safetensors b/model-00092-of-000163.safetensors index 8b26c7daec3a59f73af5165bad1ff415f4245342..bd744bc2fe40f7756e44628282fc691f9b6c11eb 100644 --- a/model-00092-of-000163.safetensors +++ b/model-00092-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f9e99f4a974577f34312906924a64a500af8f6275bee21e4015eb09bbd5415a4 -size 4302350620 +oid sha256:fe0d3b8dfcdd12e92f3e7722e792e142878dd4bf5a9635195e1c04e2dffe6581 +size 8598786616 diff --git a/model-00093-of-000163.safetensors b/model-00093-of-000163.safetensors index 0704f1ac2957462b593cd45046e96e9d95f3d447..fca1d349a812c947401036c4742372fa6579925e 100644 --- a/model-00093-of-000163.safetensors +++ b/model-00093-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:bc7300167ed6f5e603c43d1aa87bfa040d60a2a103ed57162ac08f682cb75974 -size 4302384692 +oid sha256:812f9070f62451882ef5f112d01be34268365364636ea01ea41fc07638881115 
+size 8602554312 diff --git a/model-00094-of-000163.safetensors b/model-00094-of-000163.safetensors index a31523799889f528e12a0fa706b47daba93e3f07..076c733d5bf6a43cf66e6e001da74604346c4dc4 100644 --- a/model-00094-of-000163.safetensors +++ b/model-00094-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6cb0e4055409ecc754dd058e2d350039022d43f4ac1840825a41eae71cbb1a20 -size 4302384963 +oid sha256:51db107874601bbcadbbaecb29af71901b422fc83fe423102823f02550a67d51 +size 8602554448 diff --git a/model-00095-of-000163.safetensors b/model-00095-of-000163.safetensors index 066a8fbc0c7a00793d42e21a90fd6fcc3acc5bbc..e9f0b7cca14b6ce6a942ea6744b458e219860dc8 100644 --- a/model-00095-of-000163.safetensors +++ b/model-00095-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f1387857bd9d101cc83527b95a9945719b0b9484d77e966c5e3d9e8272f8d89d -size 4302350448 +oid sha256:3c37f8e321e95bc12c8f64f6d4921f225b68883aa3f8a7d6470af82cd0b0a929 +size 8598786520 diff --git a/model-00096-of-000163.safetensors b/model-00096-of-000163.safetensors index 79b90f163d57cd537eb21a928885e6c98c4d036e..a95f20425758999c6037085dba5d4125746a8377 100644 --- a/model-00096-of-000163.safetensors +++ b/model-00096-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:b58d7c50e54b8957e2b620c57016e3c6087f2eaa18f8572bdd8d3606511bb4fa -size 4302384884 +oid sha256:03c7de49d3a5a2cff8b514f8dd728395561eef014dd538f63f03a3b9a8373c8a +size 8602554408 diff --git a/model-00097-of-000163.safetensors b/model-00097-of-000163.safetensors index 30120948aaede702ccaf86367fb53146a9857bd2..13c2a2f60a28853c9fc6cb7d1433072e98a9e5ec 100644 --- a/model-00097-of-000163.safetensors +++ b/model-00097-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fa678aaed884639512b36c1ecd4620d01af7f45b4244d730961f4d08806207f2 -size 4302350824 +oid 
sha256:b69539d9e034375e10c94e5d9b3e9be89a9ffabecb920af6c7416d06e7a765f8 +size 8598786720 diff --git a/model-00098-of-000163.safetensors b/model-00098-of-000163.safetensors index 7bdd20a2fe786303a801b654fd5db3465e9f3125..b4684fa7021fb04a3d9a2f9e53b3f9b2761a5e61 100644 --- a/model-00098-of-000163.safetensors +++ b/model-00098-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:a2cd517b56750d4f5791fe30b951da61a6f9235baf71811019b1c4228b5ee934 -size 4302384488 +oid sha256:1cef330169c2974ca270d9c8489d0100a5eaed839cd701bcc52677488534477b +size 8602554208 diff --git a/model-00099-of-000163.safetensors b/model-00099-of-000163.safetensors index 2055ccde45f61d399fb5ef3c304913030b5c2156..9e612e0eb2091e7e9be4fb4255fa9074df9086d6 100644 --- a/model-00099-of-000163.safetensors +++ b/model-00099-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:06d5aa90ee2e7cc83c42abd109f1abb92660b96abbb0514dce3f14f36b968624 -size 4302384963 +oid sha256:93c869482aac8e034310f933a37540234a33d70059a859bc3e4d53ec037d68c1 +size 8602554448 diff --git a/model-00100-of-000163.safetensors b/model-00100-of-000163.safetensors index ffaa5e3069e8e5547a9ed13c30f65aa956bd5c72..8565c04de44a88b4dbfd0f8fe39e0ef07c997a49 100644 --- a/model-00100-of-000163.safetensors +++ b/model-00100-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90e85dc99298fe2e4933e6cbaec263c03a0cc048c2936231a920b2dfa90b8258 -size 1747417474 +oid sha256:bdb3914a6c94e69bd36613f0857e956566b24fa2478cd91995d62390b8a33de0 +size 3493899088 diff --git a/model-00101-of-000163.safetensors b/model-00101-of-000163.safetensors index 00816279cc79c2221df1d357f12c6258d9507b04..570334ff85609d87fc65e84152529cda03ed4136 100644 --- a/model-00101-of-000163.safetensors +++ b/model-00101-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid 
sha256:9976dae2a44b4407a3a39dc69104ccce67001a307b1b49e966c98ab246b371f2 -size 4302317817 +oid sha256:2e2760eec1c139dc1f11d9b98fe72338a52fd37419b2607c291d434a3313692e +size 8598757608 diff --git a/model-00102-of-000163.safetensors b/model-00102-of-000163.safetensors index 63c239b3dac889404be8f0a08c65bd363979383a..24c7193d500e86932b2ac1cc347616d2928b0450 100644 --- a/model-00102-of-000163.safetensors +++ b/model-00102-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cf36bd6e7a27d2f0a41f2e5387e2be53918fbfe4c886952e2ab55bd96b56c23e -size 4302384914 +oid sha256:1ac5c91acddd7671ef984c2decede61fcfbe6af480968c9cfe494bc2b78015ca +size 8602554424 diff --git a/model-00103-of-000163.safetensors b/model-00103-of-000163.safetensors index 4bdb3b66eb262b00b2850d86c136f88c9e20a530..ded66fd42a358b1aedfe4a729145bcb22091c92a 100644 --- a/model-00103-of-000163.safetensors +++ b/model-00103-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:f8e08c2159b56b25dbdb1800897729f5f0bc11b8c07bc660f031e4d6a9af09b8 -size 4302350794 +oid sha256:73eb9c69a7d26eb510f0678ad5a359d34047093b1b38b8ee07ac8831555996ca +size 8598786704 diff --git a/model-00105-of-000163.safetensors b/model-00105-of-000163.safetensors index 5e5034e1340caaa224762020474b3484ab292c42..1cb7f8a62973b5178ac8c0a06fa6796149987206 100644 --- a/model-00105-of-000163.safetensors +++ b/model-00105-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5541411c798dbce3610e56b1a0d4c21fe8fa4cb35cb82b4c8888942305d812ba -size 4302384963 +oid sha256:51c723ab40c000e28f98fc8517297ce4755bf56ecb5f1a37b083eb1d5937e295 +size 8602554448 diff --git a/model-00106-of-000163.safetensors b/model-00106-of-000163.safetensors index 321c85bc089b2cb1636203eb779af30c213278c4..4e99bbf503f2160dafcafa02bcbecf1afce60e9b 100644 --- a/model-00106-of-000163.safetensors +++ b/model-00106-of-000163.safetensors @@ -1,3 +1,3 @@ version 
https://git-lfs.github.com/spec/v1 -oid sha256:5a2d163f3ca1eeb85e35a44ab6d162af6a6f531186b1a50221c13d2c1254c0be -size 4302350602 +oid sha256:c09fa4d90df379998484ba098d096dc2dbf09a473d29f17b6d6c902275de4ca0 +size 8598786608 diff --git a/model-00108-of-000163.safetensors b/model-00108-of-000163.safetensors index 9a773aab92919745b04c4fe39e82ca7b3d4a57da..20c512c9cd3504fd9cc813589f83a78d3ac39e64 100644 --- a/model-00108-of-000163.safetensors +++ b/model-00108-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2813892afb5bea5b3375e03e5c2474f7828078a9e35ffdcba01a710193477ccd -size 4302384963 +oid sha256:7dc5081c01628cd9f18079a4150e939ac00b0679e832cae1c3a3c4561e76b4fc +size 8602554448 diff --git a/model-00109-of-000163.safetensors b/model-00109-of-000163.safetensors index b7c612356292ea7194ab666eb7f3306b69f9d8ee..0b1daaec51fe29825dfd4ca24f22cd80a93053e4 100644 --- a/model-00109-of-000163.safetensors +++ b/model-00109-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:70b59cb0fe6e89b982b64be838543e9387acd9d597299347e9852962f0866eed -size 4302350432 +oid sha256:fd0a84f7c0ecac01732ae0d0689482a0405d3885ca8184d0e7e832282a5aa114 +size 8598786504 diff --git a/model-00110-of-000163.safetensors b/model-00110-of-000163.safetensors index f8763a741baacf8c64e95ddca568bc996ed6214a..fd2d581b6e4353083566866064f3e2abb1046785 100644 --- a/model-00110-of-000163.safetensors +++ b/model-00110-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ce860b0acca56cf2903c322983e58f74829d30c26c6519f50fc8f90b9c3570d8 -size 4302384900 +oid sha256:ef9a72aeefd1d5f4b8b324a853acb001f16432fdc98f1cf8f24abd3901aab4db +size 8602554416 diff --git a/model-00111-of-000163.safetensors b/model-00111-of-000163.safetensors index 5c6743baffb7d83eab24c50f31cba514c1ae0897..41cb7848013fc5138fb036344d1e29978e8b262c 100644 --- a/model-00111-of-000163.safetensors +++ b/model-00111-of-000163.safetensors 
@@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:912c0c99c138a314070f6534af23149a84dd7eb53b419808010fe5fa0f7ed066 -size 4302350808 +oid sha256:410ea3087bf083787ae185e0896f5195b437ed77cfc9c3f3626f5060792d4d28 +size 8598786704 diff --git a/model-00112-of-000163.safetensors b/model-00112-of-000163.safetensors index a2c9fc013664dfb24ed5696dbb5541d75797f945..fa7d33a6bdf86f2feceeab332f3ab08f210f729a 100644 --- a/model-00112-of-000163.safetensors +++ b/model-00112-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8d9989812d88e027e7bd02ba1d19e61fbffb40ac05a0a7775eb82335a429d457 -size 4302384504 +oid sha256:43ac50ae4b9fb4851730f9c7b617b4383c96f58cf6427382f0b44c007c5df3d1 +size 8602554224 diff --git a/model-00113-of-000163.safetensors b/model-00113-of-000163.safetensors index dab65fcdb080804e625afde6f13ccf9234957843..e5c4dbeed6f4dd4df0a37e8e06743dfa628c8d08 100644 --- a/model-00113-of-000163.safetensors +++ b/model-00113-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:02c14d13f644dd148d038632610e300627e4bc4b4a0f81b73c209d29c4a36f89 -size 4302384961 +oid sha256:d562c0e1509e03d8c7f0809f0899ddb505599dc39f059c49a90931c357ab5cf4 +size 8602554448 diff --git a/model-00115-of-000163.safetensors b/model-00115-of-000163.safetensors index 87674756728567ad077c64566fd542804769eec0..3d7c43a404b203e7d03e58553fa4a47ca91fed94 100644 --- a/model-00115-of-000163.safetensors +++ b/model-00115-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5a66f0fde0ffcf4b69f044c8159a85171153c41327ad7ae0d9ce1054c203b505 -size 4302384692 +oid sha256:24095dd8a22ddae161250c9e44425e5283faf3804c3e8923ba2621e7bfe041ff +size 8602554312 diff --git a/model-00116-of-000163.safetensors b/model-00116-of-000163.safetensors index ee85ef62b148eb0a49375ecfbb04e3cb02758206..f1435bbeb8668021fd09c3e4442a7e2f43685243 100644 --- a/model-00116-of-000163.safetensors +++ 
b/model-00116-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1102daefb72e32625becfe1ad290ff818b779d73649c7ff9e315a7e2de314bd3 -size 4302384963 +oid sha256:b6155fd3ce66875d52c287aaaf51213fe9bf79914d33dc1017d0029679dbaaae +size 8602554448 diff --git a/model-00117-of-000163.safetensors b/model-00117-of-000163.safetensors index bd0ede0db9a934907c53dba9f34a29a06f1a5962..fd5e9c7b6193c6b6066b4f4e6468ddc8cd4bd6f8 100644 --- a/model-00117-of-000163.safetensors +++ b/model-00117-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d92157af0d4af8ef953cf7fb6e0b38b406fb7c4b35bdab01be2a2eddf450407e -size 4302350448 +oid sha256:0b4e3fc95afafb6df6ecf6efb6339e7186d3df1bd2dacd3b5bafbe3dbaf044d9 +size 8598786520 diff --git a/model-00118-of-000163.safetensors b/model-00118-of-000163.safetensors index f0ad49de593545a8a4d28132fcc6fb148ffe259f..97f0c10a589208048185289074f99d155ab6cf99 100644 --- a/model-00118-of-000163.safetensors +++ b/model-00118-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ba30d60916a77c4ce013cfbbcc453377b70c2a75ef0456a4458c9ca547111993 -size 4302384884 +oid sha256:2883e9361ebdc25998f323655be8ece6a3387da2c96daf5c48b860483e515c31 +size 8602554408 diff --git a/model-00119-of-000163.safetensors b/model-00119-of-000163.safetensors index 2cfb7b74c6a526e4fe222b02bb27cf7b20b3fcd9..67073bd72fe4eece32a0cba81440200a98f6b264 100644 --- a/model-00119-of-000163.safetensors +++ b/model-00119-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8938205f9d550a945121f153beb9c9c8f169eafddfc56621cdb6235e011ba294 -size 4302350824 +oid sha256:d7cbfa4c05ae201e498e881ba9d449c7bfafecb6bcdf492cfc079bae56fcaf2e +size 8598786720 diff --git a/model-00120-of-000163.safetensors b/model-00120-of-000163.safetensors index 2cbda8e89101e67effc4ed10ce8ae47141ab23b4..314cec8d8f734958edcd5954e5a6ee4ea72dd4f1 100644 --- 
a/model-00120-of-000163.safetensors +++ b/model-00120-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:18fa9b624779af7372e26ef79096b1ca341b3ff2be616d11bc3df2cf07387a33 -size 4302384488 +oid sha256:777ef60a2bf8130814576bce8f45c5f77ca3226a933aeb4eeb717cf3a5d7514c +size 8602554208 diff --git a/model-00121-of-000163.safetensors b/model-00121-of-000163.safetensors index 575c1dd3febc5e77e5500fb092085ff6842fcddc..1dce9bfd85e192a2a49fa552dcca855bb2a2d30d 100644 --- a/model-00121-of-000163.safetensors +++ b/model-00121-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:669570df0b213487a0f0cd1f8845fac53c9c19c942dd14d3a42c0ea97cc28c6d -size 4302384963 +oid sha256:bf17a7dac40774827752693bff5ee1630b59e65edd1d00f9e3a49dbc461aa86c +size 8602554448 diff --git a/model-00122-of-000163.safetensors b/model-00122-of-000163.safetensors index 941f2ba8f8d59caa7d894ccf407fe3e69a61cdc5..e15a2a5ddc25b172399bfa91844c47ff78e36aa8 100644 --- a/model-00122-of-000163.safetensors +++ b/model-00122-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a9a82578c3a7e6bb45f36fe41e7922d777787bf45c767c02db9897b21ea8354 -size 1747417474 +oid sha256:b99d022aac3274bee416eb456e9d41efb7d9d3d8b0ad586bed48ff2e8ca4fdd8 +size 3493899088 diff --git a/model-00123-of-000163.safetensors b/model-00123-of-000163.safetensors index b90cb3cd52413e10ca7298c12919f3e80e4e5533..ba3af32ac03f146937c2c481e4c7e170a3ebd2eb 100644 --- a/model-00123-of-000163.safetensors +++ b/model-00123-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:84723e0f5c3f520e83b75f73318f9f7ddf43702893ae138e9fc560410f674f46 -size 4302317817 +oid sha256:0a32c24ff8f857e2a931ad520063a67ecd9bd1a7a2ab59bc11740e0a46412a48 +size 8598757608 diff --git a/model-00125-of-000163.safetensors b/model-00125-of-000163.safetensors index 
7f1045bd882bb050fa664ebbdddd6b7745e9f02b..f48e2b0b4796cfffd37d2d6a435ea7344dba623a 100644 --- a/model-00125-of-000163.safetensors +++ b/model-00125-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:562c9706e1b17d25916b4929f2210c489cf6f8b0311d087e0c851fbcddf50607 -size 4302350794 +oid sha256:e3a8dd78fa8e2e08e16c5a535938162fc15f64724ac24e1b5d0128e016a70451 +size 8598786704 diff --git a/model-00126-of-000163.safetensors b/model-00126-of-000163.safetensors index a9121c748189a58506f7d363f613f84b97fa4dda..738f93b8da69f76a7d72b661c837fc5fac1aa1b3 100644 --- a/model-00126-of-000163.safetensors +++ b/model-00126-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:949da3c082f9aad8c2e03e7b1f26dfad76716f85696d889cd21feb8ae6818c63 -size 4302384518 +oid sha256:b8844009f6f3fa302aa120e165485d97cacda5cf4239256e375b41c620f68c11 +size 8602554224 diff --git a/model-00127-of-000163.safetensors b/model-00127-of-000163.safetensors index 9b08478bd9694a0378b41eaa9e5bdd44e7d41f1b..7cbb77b725032dcb472baf10248ce5594ed55000 100644 --- a/model-00127-of-000163.safetensors +++ b/model-00127-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8871e7ca5651392dbdd9a5e66e398c284fc1c7111d496a2143ff497fc82b7741 -size 4302384963 +oid sha256:f70e1b38623fd279710f662e542ab42ee68b63f88e2ca47f427d7b7040f2075a +size 8602554448 diff --git a/model-00128-of-000163.safetensors b/model-00128-of-000163.safetensors index a24a13b8afea6646c866a7c60a37cc98c55a4436..02e4bf298db4e6daafb0d0903d73b76376068a52 100644 --- a/model-00128-of-000163.safetensors +++ b/model-00128-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:cb8a5a4d53a670bf283791a2f07a65ce75b6426da3d2480f8dc650124d8d0edd -size 4302350602 +oid sha256:c3e7b467abc96c76ddd8a41dd91d811d73e2482c748e2fc6cdc7ee1e171797fd +size 8598786608 diff --git a/model-00129-of-000163.safetensors 
b/model-00129-of-000163.safetensors index c5b49d853475abb588e3817e3e59195c1d347e01..38a701c8850d09116535f49579125bf4dc7c5f5b 100644 --- a/model-00129-of-000163.safetensors +++ b/model-00129-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9a49ccda2e63b822be58c50320b89767108c81883fc42d13d52042e2548caf53 -size 4302384710 +oid sha256:909f51b71066c9de541a6d99086a23f3c19975fdad5428325c7c7b33d6b17b1b +size 8602554320 diff --git a/model-00130-of-000163.safetensors b/model-00130-of-000163.safetensors index dd7db4a77300d4b95c7a17bec1828659913d5f19..d86731044df2733a008e87af357d9b6506449206 100644 --- a/model-00130-of-000163.safetensors +++ b/model-00130-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:00ceb885b7ada31e130ba2faa47ed18b1e4a3e020ed0971a49b86f02d2933aec -size 4302384963 +oid sha256:f68ec4959cbcd33a675d600cbcabe761f1ecf440b8611d9329c0e43360073fa4 +size 8602554448 diff --git a/model-00131-of-000163.safetensors b/model-00131-of-000163.safetensors index 6985b01f92de96fd2672e59cdea5354d5f755c1b..8794b4f16323f412fd2b5071fac552888a1543d1 100644 --- a/model-00131-of-000163.safetensors +++ b/model-00131-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2af936134d19252994e75178f70d68c2381393f698224bda38af657efdcb7b94 -size 4302350432 +oid sha256:912cf46b37618c353deceabfddae3dda571e4b5e20b1bb02cee9821af0387bf6 +size 8598786504 diff --git a/model-00132-of-000163.safetensors b/model-00132-of-000163.safetensors index 3897b7293dc389079550de0dc8c4fad78564e9c3..8822e0fd062d3fde9dad37d63fd058e3e39d92de 100644 --- a/model-00132-of-000163.safetensors +++ b/model-00132-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7ceabb5bfd0b48f6617d94ed9d4b78ee037ea56c907937addad954eb98e61b6f -size 4302384900 +oid sha256:cef14487076e7f4667646e75ee7684af76ca242d3d274fb0f6e3d27ae143e1c0 +size 8602554416 diff --git 
a/model-00133-of-000163.safetensors b/model-00133-of-000163.safetensors index cd15bae8d5ab7dddc2d5f7e00e13d9abf2930997..676b3a6d7952990a2b410b2ffd9440552a9b4d90 100644 --- a/model-00133-of-000163.safetensors +++ b/model-00133-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:213c0ae67ab8576f70eb9b45430de11bd20a37044e28b1974cac58fc5d11260e -size 4302350808 +oid sha256:09bb1c6c25d17f1e5a3ccdec2420dac338e073e62489f98dc85f022a889a0ebc +size 8598786704 diff --git a/model-00134-of-000163.safetensors b/model-00134-of-000163.safetensors index a6e91905784aa102d2e72e843ad31fd76b14f3fa..52be002db2a94e8e29ce9605da9467b7dc956c1b 100644 --- a/model-00134-of-000163.safetensors +++ b/model-00134-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d2cd64a8c397d2e333b84f1475312245a82455d1183641936caeec6acd7794f7 -size 4302384504 +oid sha256:10ec4cc7280fde28911cadc7e6605249ae6c77954434cbe20140cb13bdd7a5e5 +size 8602554224 diff --git a/model-00136-of-000163.safetensors b/model-00136-of-000163.safetensors index e6f77937d9a68139b92ea8eaae857defe44677da..cf6cb95b68fcdb89e41d4d6c4bc3b53c8e06d358 100644 --- a/model-00136-of-000163.safetensors +++ b/model-00136-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ca04d3839513a925bdcf18a805ceb8b76a5d8e0adabf36f685f18f42933d7b62 -size 4302350620 +oid sha256:265be47028b3119ec0ee0afb258340b68cef757ee65c66479dc96056594b5be3 +size 8598786616 diff --git a/model-00137-of-000163.safetensors b/model-00137-of-000163.safetensors index 8e80c2a38022f2c733130acaf684d4b2c1831f64..d061c4cb1d144664f91a30fbfeecfa65bb1e01a8 100644 --- a/model-00137-of-000163.safetensors +++ b/model-00137-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c45464fc9beebb881ce5a726e8db9fb71c66c8362536866a3e4a081dce664cd6 -size 4302384692 +oid sha256:942888041af0c6a0e7840a66af23958760b6f7493b240364fb0a319902bbf3c5 
+size 8602554312 diff --git a/model-00138-of-000163.safetensors b/model-00138-of-000163.safetensors index ae4f256c44389bdbc40a92e7e667039d794c0ed6..ebd197e64b83e09c54d9d727152ebc0602de29ca 100644 --- a/model-00138-of-000163.safetensors +++ b/model-00138-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6a1fe7da4eaa62603aa623e28bd671e2b06f6bf8aa01a39075ae07e4a1edff7a -size 4302384963 +oid sha256:59f36ddad663da3d46dad86174c2adf6813ed3d3ce61b8b2f56314ccf8216c50 +size 8602554448 diff --git a/model-00140-of-000163.safetensors b/model-00140-of-000163.safetensors index 3fb223e6c331c0f04ba1201469c594ce34c652c0..9326f02dca72b2449451df38fc46a90fc6287c8a 100644 --- a/model-00140-of-000163.safetensors +++ b/model-00140-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d6ae521438d756a1effc1b2a55cce9f632fad975910f43360c86dda2775e7217 -size 4302384884 +oid sha256:1931c021e4d13f093938370ff49a17b820b4c1a15d502cb185af261840837540 +size 8602554408 diff --git a/model-00141-of-000163.safetensors b/model-00141-of-000163.safetensors index 18f5d61af5737fbbe3932c1f11b4c3d610b2cb48..435fdb30ce8be20d04eb4be36ab91bd1d5399290 100644 --- a/model-00141-of-000163.safetensors +++ b/model-00141-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:2e49bea9a5128a8d986d2fd42d79cef2997e637a7f5b58305c47ccc449620fc2 -size 3142388798 +oid sha256:57d6e7d990ed5f1335e8509dbdc0065248df95491dc131a7b948e9fe7e0eb1c4 +size 6283123256 diff --git a/model-00144-of-000163.safetensors b/model-00144-of-000163.safetensors index a9fbc9ed8057c1cb7566765887c2546f5412a9cb..c36df0637564edb48ad8dc9b9b3a448f117c35c2 100644 --- a/model-00144-of-000163.safetensors +++ b/model-00144-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:e44a3f3680624d3290d196eab64dfb86af8019f50bcf3a992ad7cd6638735a79 -size 4302350794 +oid 
sha256:c72c67e05272f9925cc321c33ce06e4cd32c485a92d766a56f35317c7cb029a7 +size 8598786704 diff --git a/model-00145-of-000163.safetensors b/model-00145-of-000163.safetensors index d6c5476856aaecca921efb8d5d7259465e880a63..08fab34e7fcc5b70a3c5fc4c132ee809ffeb5b1a 100644 --- a/model-00145-of-000163.safetensors +++ b/model-00145-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c9c978c5afe32ea1f5afc0f5f65205441a421b5eb6d1942fca8cba9e6650c224 -size 4302384518 +oid sha256:49f5c0d0ce3cd2af63462da84e0383e27c6056eec79a3872140e4a2dfbf22fc5 +size 8602554224 diff --git a/model-00146-of-000163.safetensors b/model-00146-of-000163.safetensors index 878bcb2618e8092f22a493827c490b5d57fd55e8..c887ff9756bb75a88c593b0e1568e033d56bb1e4 100644 --- a/model-00146-of-000163.safetensors +++ b/model-00146-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7f2a681f4931365b40febad455f0b73179f1a26f43735f6af3dd73b1c3d6c05a -size 4302384963 +oid sha256:026f721bf0c3a60bff6e0579c75a40f43e702673875c2e96f1b010e8144f6e9e +size 8602554448 diff --git a/model-00147-of-000163.safetensors b/model-00147-of-000163.safetensors index 15e2c0b48c2b2225eef0d9feb07647d96f1a62bd..fede93ce34b8f321f18763b766c4afd387cab01e 100644 --- a/model-00147-of-000163.safetensors +++ b/model-00147-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:14cb65858eaf602ba8604ce2be5c74c0f94a922bb492064fc2048d7e9b6efd2a -size 4302350602 +oid sha256:77b98510be58300d3bb5b62803aeb5a64cc56639e99e29b4db73a30f6a73d2bb +size 8598786608 diff --git a/model-00148-of-000163.safetensors b/model-00148-of-000163.safetensors index beb9e3fc508c5ff2e9f0849c933bbdde8a2c33c3..57c450989c73e8253367fdf714fd5f4fd4efa599 100644 --- a/model-00148-of-000163.safetensors +++ b/model-00148-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid 
sha256:a4185359e4e4abe44c234981089be0b2873dc1fc1b21246711873b7f18b30fe8 -size 4302384710 +oid sha256:cc3230098de1dce74f89ea69be543bd87a973feae02ba8d8598a255ebde7fb62 +size 8602554320 diff --git a/model-00149-of-000163.safetensors b/model-00149-of-000163.safetensors index 74632203eb0efd9ce1ccc90d2173b233ce761b23..18355daf9fcb68b3c28de73b36239efaeef0dafa 100644 --- a/model-00149-of-000163.safetensors +++ b/model-00149-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d9be3b4e6790c9d217e1cc8753813307c9f791b8e7f8e8c6cacdc98c08776755 -size 4302384963 +oid sha256:3b29d8e0238e99f5c9ebae14b0a761a9ae5b1ba29d66f738f288a51d9b98175c +size 8602554448 diff --git a/model-00150-of-000163.safetensors b/model-00150-of-000163.safetensors index ad310473e2576f051dad5440b0dedb4090747a6c..42afc67e5e089e92b55e78f43887662e2a963a41 100644 --- a/model-00150-of-000163.safetensors +++ b/model-00150-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:90d40cf5fb984157cd322681b021c6253f125dd51c9d8b4da986c6a97552bad7 -size 4302350432 +oid sha256:f6376b4f3180c22e6dcbbc9fbeb26f588c4f42c43b14e8849f71f6a2bcc6d9fd +size 8598786504 diff --git a/model-00151-of-000163.safetensors b/model-00151-of-000163.safetensors index 642994f17afb16b7e88adcc6d5f0499337558820..0cf6badbfd8da2f42661a809ff7a3eb29ab58533 100644 --- a/model-00151-of-000163.safetensors +++ b/model-00151-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7222b3366b2793b213134c5d8caae6569a9622b6b235e54f5500a57b80bbdf9a -size 4302384900 +oid sha256:0e43bb4fe113721c9b5672925b2363a42b030f95758c7a80f11a682ec5e0771d +size 8602554416 diff --git a/model-00152-of-000163.safetensors b/model-00152-of-000163.safetensors index 7822073bfdbba00f8edbae08d7cc7f4d0fe42ab6..7db1b5b6804373c09888bda01c82043c0f297c2f 100644 --- a/model-00152-of-000163.safetensors +++ b/model-00152-of-000163.safetensors @@ -1,3 +1,3 @@ version 
https://git-lfs.github.com/spec/v1 -oid sha256:0654913bb563ba931d8a54a15760d3619e5e1537841717c120c0e0623d1bf4e2 -size 4302350808 +oid sha256:97f35fb6e97dac5d936f1f31ba330a01cd7b9f30b4aea181681af4452923f753 +size 8598786704 diff --git a/model-00153-of-000163.safetensors b/model-00153-of-000163.safetensors index 7f3e9b7120eac5eb2c77a8e083377a3ec2061504..67e2eac7cd5f678187030c2fd48606d1eb973c53 100644 --- a/model-00153-of-000163.safetensors +++ b/model-00153-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:4e09a5eb4e1ea762c0b9a0691763cae6141b71276e4190f55a42310d8c977dc1 -size 4302384504 +oid sha256:01a29cc828089ec04d6f315f09c13f1fc1bab86e956e2d3c985e53f9e10561e8 +size 8602554224 diff --git a/model-00154-of-000163.safetensors b/model-00154-of-000163.safetensors index ac025ea41055413df085b9efcc46f7c1087c422a..7b59ab669d41472408ecbac07f553287ab90c766 100644 --- a/model-00154-of-000163.safetensors +++ b/model-00154-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ffc11b87992ce2639ff28f9ff8772ccd76a59b7409e633fc1211216155af13ab -size 4302384961 +oid sha256:5b8562973a1972c75fcd70c513406d8899e5645e2b6564aa7af899efe7522ec6 +size 8602554448 diff --git a/model-00155-of-000163.safetensors b/model-00155-of-000163.safetensors index c90378e6fcb6ed85b0bd0c4795d96851eaa1f1e5..49d41264836f5a32adcd17dbccdce7eb6363b787 100644 --- a/model-00155-of-000163.safetensors +++ b/model-00155-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:d47a88b4d7377cb4d5a5aa44943a71f5296e41dde8eeeaff40ffc7b885d07291 -size 4302350620 +oid sha256:eb284b6997fd900a2d224ecb57272a566180f714e1aeea69c497256b6568b8d2 +size 8598786616 diff --git a/model-00156-of-000163.safetensors b/model-00156-of-000163.safetensors index cb64d0616b777397d0808a787e78ebb4281b390a..69787432a4f89cd6026242b94fc685d6b6df6ef3 100644 --- a/model-00156-of-000163.safetensors +++ b/model-00156-of-000163.safetensors 
@@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:eeadc5eb1bd92f99c1f42f25a6d835cfb6282274b4ed23a0ed6f3ad4148beed2 -size 4302384692 +oid sha256:54303e9b94484df81a919f7c9c2fbf50af615ebdb44b67bea9da20c0e5f1f69d +size 8602554312 diff --git a/model-00157-of-000163.safetensors b/model-00157-of-000163.safetensors index db5ece915de01003e1f5da39599fa6e781b632bb..9c9b964d39dd23ae731ede37b8541552f9cc1145 100644 --- a/model-00157-of-000163.safetensors +++ b/model-00157-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:8205af59d738aa2e952ba3e2eb66c5617c8884a86b931c31fd270005712d5692 -size 4302384963 +oid sha256:78d66e87911fbbb61d89030915d9d233f046a06f6bce552b7b90ae37299fe497 +size 8602554448 diff --git a/model-00158-of-000163.safetensors b/model-00158-of-000163.safetensors index 0af36e4d7a0c8111ff5b461c94600b1e5f576136..6722b98d66cdf954a4809879a0607d403044fd89 100644 --- a/model-00158-of-000163.safetensors +++ b/model-00158-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:c122494d667414c2cf68d7a2f0e7ffd011c6eb26bb8391afeba47932dce5a928 -size 4302350448 +oid sha256:21aee3f97b705c82b5c1ca3e0bd054857723d174a5b2783f336e875ee1accf1b +size 8598786520 diff --git a/model-00159-of-000163.safetensors b/model-00159-of-000163.safetensors index 7b957f413a4c651d20fee6934315a2fbd136ec80..02aaca7b4236357cb0f91abe4042eb8981a451e6 100644 --- a/model-00159-of-000163.safetensors +++ b/model-00159-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6e01a5c5b28be729f6d244c2a828c4427c78c3f0777cc61f61c180d185703fb2 -size 4302384884 +oid sha256:1e86648495eac2e41a872aa161e5ef9770c0ffc4ca8c000dc5adc347a305e55e +size 8602554408 diff --git a/model-00160-of-000163.safetensors b/model-00160-of-000163.safetensors index 552e142dc3ddcdc53be447fe5798804c49908ecc..c11101915907c978b5f6ab5bdd20d5802179b73f 100644 --- a/model-00160-of-000163.safetensors +++ 
b/model-00160-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:5163fbdd76df28fade80aabc3e071f473cb33751eaf2ecb4fa3932a5d8e77609 -size 5230637362 +oid sha256:03a81276afe58b4aa666144d58a580aeabec4aa956a39873b72108c5dfc00d16 +size 8602463472 diff --git a/model-00161-of-000163.safetensors b/model-00161-of-000163.safetensors index 48370c0b238fc8ef9846acf241cffee6c4153f03..6ea62a76a1483dcfe46159eefcdac38d4184cb99 100644 --- a/model-00161-of-000163.safetensors +++ b/model-00161-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dc4497ab378fb78f7fcebd4de0890f8f710e1409f544efe02896f4155dca9587 -size 4302384321 +oid sha256:af46e3d0b9ff605fc7566a50ca7e08d6dfc3c1fd38b036cdbb229cd611550f9a +size 8602554128 diff --git a/model-00162-of-000163.safetensors b/model-00162-of-000163.safetensors index 4b4efd5bbb7a50f249462810153938c3ebc45f08..888f5238e50c8b42f70002ff9812843e0fe519d4 100644 --- a/model-00162-of-000163.safetensors +++ b/model-00162-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:9c8582309da9422e3dd517fa9a1f93ce7bb88f7e4626748509a9c84ae8394c58 -size 4302384948 +oid sha256:753e500138404632e84b090bfba221d9557bc80d0bb3487f5c3340bb593c5a65 +size 8602554440 diff --git a/model-00163-of-000163.safetensors b/model-00163-of-000163.safetensors index f164acdff7205fac284cd0adecbff217d1815207..4c469afb3589ee5d2edbd9ae45dadd39b0dae17c 100644 --- a/model-00163-of-000163.safetensors +++ b/model-00163-of-000163.safetensors @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:0a97cb51f6a9002f817b38eac66400d3b72ffbc1b2b9ae654562bba46c904f5f -size 6584784447 +oid sha256:c322a64df2fd80b7c609a2f583d1d1bcdafbcb3ea93f60654ce5b6889ba4f257 +size 9255875920 diff --git a/model.safetensors.index.json b/model.safetensors.index.json index 210ab5c5ca880ad0003c3b0ea876eb05f3215136..5b60276c1efb766f6a1aee2e357e27407f6ed12b 100644 --- 
a/model.safetensors.index.json +++ b/model.safetensors.index.json @@ -1,91991 +1,46181 @@ { - "metadata": { - "total_size": 1369062772000 - }, + "metadata": {}, "weight_map": { "model.embed_tokens.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.0.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.0.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.0.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", 
"model.layers.1.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.1.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.1.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.1.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", 
"model.layers.2.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.mlp.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.2.mlp.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.2.input_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.2.post_attention_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_a_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.q_a_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.q_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.q_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_a_proj_with_mqa.weight": "model-00001-of-000163.safetensors", - 
"model.layers.3.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_a_layernorm.weight": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.kv_b_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.kv_b_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.self_attn.o_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.self_attn.o_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.gate.weight": "model-00001-of-000163.safetensors", "model.layers.3.mlp.gate.e_score_correction_bias": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.shared_experts.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.shared_experts.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.0.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.0.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.gate_proj.weight_scale_inv": 
"model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.1.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.1.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.2.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.2.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.3.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.3.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.4.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.4.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.4.down_proj.weight": "model-00001-of-000163.safetensors", - 
"model.layers.3.mlp.experts.4.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.5.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.5.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.6.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.6.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.7.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.7.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.up_proj.weight": 
"model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.8.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.8.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.9.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.9.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.10.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.10.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.11.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.11.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", 
"model.layers.3.mlp.experts.12.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.12.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.12.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.12.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.13.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.13.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.14.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.14.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.up_proj.weight_scale_inv": 
"model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.15.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.15.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.16.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.16.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.17.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.17.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.18.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.18.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.gate_proj.weight": "model-00001-of-000163.safetensors", - 
"model.layers.3.mlp.experts.19.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.19.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.19.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.19.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.20.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.20.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.21.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.21.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.22.down_proj.weight": 
"model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.22.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.23.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.23.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.24.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.24.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.25.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.25.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.26.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", 
"model.layers.3.mlp.experts.26.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.26.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.26.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.27.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.27.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.28.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.28.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.29.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.29.down_proj.weight_scale_inv": 
"model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.up_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.30.down_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.30.down_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.31.gate_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.31.gate_proj.weight_scale_inv": "model-00001-of-000163.safetensors", "model.layers.3.mlp.experts.31.up_proj.weight": "model-00001-of-000163.safetensors", - "model.layers.3.mlp.experts.31.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.31.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.31.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.32.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.32.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.33.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.33.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.33.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.33.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.34.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.34.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.35.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.35.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.36.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.36.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.gate_proj.weight": 
"model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.37.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.37.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.38.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.38.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.39.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.39.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.40.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.40.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.40.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.40.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.41.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.41.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.42.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.42.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.43.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.43.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.gate_proj.weight_scale_inv": 
"model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.44.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.44.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.45.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.45.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.46.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.46.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.47.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.47.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.47.down_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.47.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.48.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.48.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.49.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.49.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.50.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.50.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.up_proj.weight": 
"model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.51.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.51.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.52.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.52.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.53.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.53.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.54.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.54.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.55.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.55.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.55.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.55.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.56.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.56.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.57.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.57.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.up_proj.weight_scale_inv": 
"model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.58.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.58.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.59.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.59.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.60.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.60.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.61.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.61.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.gate_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.62.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.62.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.62.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.62.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.63.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.63.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.64.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.64.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.65.down_proj.weight": 
"model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.65.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.66.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.66.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.67.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.67.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.68.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.68.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.69.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.69.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.69.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.69.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.70.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.70.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.71.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.71.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.72.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.72.down_proj.weight_scale_inv": 
"model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.73.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.73.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.74.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.74.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.75.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.75.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.76.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.76.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.76.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.76.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.77.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.77.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.78.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.78.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.79.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.79.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.gate_proj.weight": 
"model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.80.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.80.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.81.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.81.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.82.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.82.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.83.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.83.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.83.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.83.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.84.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.84.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.85.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.85.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.86.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.86.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.gate_proj.weight_scale_inv": 
"model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.87.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.87.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.88.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.88.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.89.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.89.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.90.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.90.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.90.down_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.90.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.91.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.91.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.92.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.92.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.93.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.93.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.up_proj.weight": 
"model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.94.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.94.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.95.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.95.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.96.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.96.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.97.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.97.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.98.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.98.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.98.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.98.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.99.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.99.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.100.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.100.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.101.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.101.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.101.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.101.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.102.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.102.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.103.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.103.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.104.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.104.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.105.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.105.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.105.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.105.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.106.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.106.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.107.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.107.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.108.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.108.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.108.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.108.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.109.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.109.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.110.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.110.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.111.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.111.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.112.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.112.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.112.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.112.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.113.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.113.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.114.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.114.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.115.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.115.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.115.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.115.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.116.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.116.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.117.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.117.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.118.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.118.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.119.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.119.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.119.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.119.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.120.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.120.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.121.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.121.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.122.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.up_proj.weight": "model-00002-of-000163.safetensors", - 
"model.layers.3.mlp.experts.122.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.122.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.122.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.123.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.123.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.124.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.124.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.125.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.125.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", 
"model.layers.3.mlp.experts.126.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.126.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.126.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.126.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.127.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.127.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.gate_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.up_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.up_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.128.down_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.128.down_proj.weight_scale_inv": "model-00002-of-000163.safetensors", "model.layers.3.mlp.experts.129.gate_proj.weight": "model-00002-of-000163.safetensors", - "model.layers.3.mlp.experts.129.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.129.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.129.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.129.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.129.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.130.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.130.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.131.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.131.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.132.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.132.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.133.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.133.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.133.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.133.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.134.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.134.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.135.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.135.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.136.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.136.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.136.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.136.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.137.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.137.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.138.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.138.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.139.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.139.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.140.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.140.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.140.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.140.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.141.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.141.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.142.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.142.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.143.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.143.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.143.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.143.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.144.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.144.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.145.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.145.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.146.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.146.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.147.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.147.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.147.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.147.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.148.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.148.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.149.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.149.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.150.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.150.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.150.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.150.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.151.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.151.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.152.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.152.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.153.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.153.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.154.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.154.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.154.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.154.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.155.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.155.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.156.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.156.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.157.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.157.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.157.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.157.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.158.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.158.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.159.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.159.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.160.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.160.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.161.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.161.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.161.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.161.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.162.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.162.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.163.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.163.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.164.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.164.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.164.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.164.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.165.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.165.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.166.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.166.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.167.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.167.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.168.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.168.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.168.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.168.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.169.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.169.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.170.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.170.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.171.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.171.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.171.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.171.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.172.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.172.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.173.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.173.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.174.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.174.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.175.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.175.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.175.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.175.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.176.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.176.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.177.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.177.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.178.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.178.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.178.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.178.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.179.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.179.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.180.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.180.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.181.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.181.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.182.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.182.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.182.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.182.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.183.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.183.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.184.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.184.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.185.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.185.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.185.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.185.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.186.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.186.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.187.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.187.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.188.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.188.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.189.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.189.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.189.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.189.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.190.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.190.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.191.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.191.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.192.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.192.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.192.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.192.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.193.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.193.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.194.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.194.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.195.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.195.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.196.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.196.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.196.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.196.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.197.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.197.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.198.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.198.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.199.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.199.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.199.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.199.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.200.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.200.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.201.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.201.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.202.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.202.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.203.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.203.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.203.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.203.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.204.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.204.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.205.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.205.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.206.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.206.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.206.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.206.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.207.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.207.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.208.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.208.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.209.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.209.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.210.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.210.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.210.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.210.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.211.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.211.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.212.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.212.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.213.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.213.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.213.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.213.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.214.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.214.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.215.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.215.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.216.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.216.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.217.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.217.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.217.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.217.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.218.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.218.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.219.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.219.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.220.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.up_proj.weight": "model-00003-of-000163.safetensors", - 
"model.layers.3.mlp.experts.220.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.220.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.220.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.221.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.221.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.222.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.222.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.223.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.223.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", 
"model.layers.3.mlp.experts.224.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.224.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.224.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.224.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.225.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.225.down_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.gate_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.gate_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.up_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.up_proj.weight_scale_inv": "model-00003-of-000163.safetensors", "model.layers.3.mlp.experts.226.down_proj.weight": "model-00003-of-000163.safetensors", - "model.layers.3.mlp.experts.226.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.227.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.3.mlp.experts.227.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.227.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.227.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.228.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.228.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.229.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.229.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.230.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.230.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.3.mlp.experts.231.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.231.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.231.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.231.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.232.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.232.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.233.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.233.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.234.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.3.mlp.experts.234.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.234.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.234.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.235.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.235.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.236.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.236.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.237.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.237.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.3.mlp.experts.238.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.238.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.238.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.238.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.239.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.239.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.240.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.240.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.241.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.3.mlp.experts.241.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.241.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.241.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.242.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.242.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.243.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.243.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.244.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.244.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.3.mlp.experts.245.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.245.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.245.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.245.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.246.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.246.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.247.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.247.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.248.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.3.mlp.experts.248.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.248.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.248.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.249.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.249.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.250.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.250.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.251.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.251.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.3.mlp.experts.252.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.252.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.252.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.252.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.253.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.253.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.254.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.254.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.255.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.3.mlp.experts.255.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.mlp.experts.255.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.3.mlp.experts.255.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.3.input_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.3.post_attention_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_a_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.q_a_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_a_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.q_b_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.q_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_a_proj_with_mqa.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_a_layernorm.weight": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.kv_b_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.kv_b_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.self_attn.o_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.self_attn.o_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.gate.weight": "model-00004-of-000163.safetensors", "model.layers.4.mlp.gate.e_score_correction_bias": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.4.mlp.shared_experts.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.shared_experts.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.shared_experts.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.0.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.0.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.1.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.1.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.2.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.2.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.gate_proj.weight": 
"model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.3.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.3.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.4.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.4.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.5.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.5.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.6.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.6.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.4.mlp.experts.6.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.6.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.7.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.7.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.8.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.8.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.9.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.9.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.gate_proj.weight_scale_inv": 
"model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.10.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.10.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.11.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.11.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.12.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.12.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.13.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.13.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.13.down_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.4.mlp.experts.13.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.14.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.14.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.15.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.15.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.16.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.16.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.up_proj.weight": 
"model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.17.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.17.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.18.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.18.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.19.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.19.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.20.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.20.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.4.mlp.experts.21.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.21.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.21.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.21.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.22.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.22.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.23.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.23.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.up_proj.weight_scale_inv": 
"model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.24.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.24.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.25.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.25.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.26.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.26.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.27.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.27.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.gate_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.4.mlp.experts.28.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.28.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.28.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.28.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.29.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.29.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.30.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.30.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.31.down_proj.weight": 
"model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.31.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.32.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.32.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.33.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.33.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.34.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.34.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.35.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.4.mlp.experts.35.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.35.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.35.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.36.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.36.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.37.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.37.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.38.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.38.down_proj.weight_scale_inv": 
"model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.39.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.39.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.40.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.40.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.41.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.41.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.42.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.up_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.4.mlp.experts.42.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.42.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.42.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.43.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.43.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.44.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.44.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.45.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.45.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.gate_proj.weight": 
"model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.46.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.46.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.47.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.47.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.48.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.48.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.49.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.49.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", 
"model.layers.4.mlp.experts.49.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.49.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.50.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.50.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.51.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.51.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.52.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.52.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.gate_proj.weight_scale_inv": 
"model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.53.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.53.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.54.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.54.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.55.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.55.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.56.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.56.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.56.down_proj.weight": "model-00004-of-000163.safetensors", - 
"model.layers.4.mlp.experts.56.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.57.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.57.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.58.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.58.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.59.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.59.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.up_proj.weight": 
"model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.60.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.60.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.61.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.61.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.gate_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.up_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.up_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.62.down_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.62.down_proj.weight_scale_inv": "model-00004-of-000163.safetensors", "model.layers.4.mlp.experts.63.gate_proj.weight": "model-00004-of-000163.safetensors", - "model.layers.4.mlp.experts.63.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.63.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.63.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.63.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.63.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.64.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.64.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.64.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.64.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.65.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.65.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.66.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.66.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.up_proj.weight_scale_inv": 
"model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.67.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.67.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.68.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.68.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.69.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.69.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.70.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.70.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.gate_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.71.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.71.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.71.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.71.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.72.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.72.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.73.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.73.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.74.down_proj.weight": 
"model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.74.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.75.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.75.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.76.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.76.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.77.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.77.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.78.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.78.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.78.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.78.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.79.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.79.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.80.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.80.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.81.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.81.down_proj.weight_scale_inv": 
"model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.82.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.82.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.83.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.83.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.84.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.84.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.85.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.up_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.85.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.85.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.85.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.86.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.86.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.87.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.87.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.88.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.88.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.gate_proj.weight": 
"model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.89.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.89.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.90.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.90.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.91.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.91.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.92.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.92.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.92.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.92.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.93.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.93.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.94.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.94.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.95.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.95.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.gate_proj.weight_scale_inv": 
"model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.96.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.96.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.97.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.97.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.98.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.98.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.99.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.99.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.99.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.99.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.100.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.100.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.101.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.101.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.102.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.102.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.103.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.103.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.103.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.103.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.104.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.104.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.105.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.105.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.106.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.106.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.106.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.106.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.107.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.107.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.108.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.108.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.109.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.109.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.110.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.110.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.110.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.110.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.111.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.111.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.112.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.112.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.113.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.113.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.113.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.113.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.114.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.114.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.115.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.115.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.116.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.116.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.117.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.117.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.117.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.117.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.118.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.118.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.119.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.119.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.120.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.120.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.120.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.120.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.121.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.121.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.122.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.122.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.123.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.123.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.124.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.124.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.124.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.124.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.125.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.125.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.126.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.126.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.127.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.127.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.127.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.127.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.128.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.128.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.129.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.129.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.130.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.130.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.131.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.131.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.131.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.131.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.132.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.132.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.133.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.133.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.134.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.134.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.134.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.134.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.135.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.135.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.136.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.136.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.137.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.137.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.138.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.138.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.138.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.138.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.139.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.139.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.140.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.140.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.141.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.141.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.141.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.141.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.142.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.142.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.143.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.143.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.144.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.144.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.145.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.145.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.145.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.145.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.146.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.146.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.147.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.147.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.148.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.148.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.148.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.148.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.149.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.149.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.150.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.150.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.151.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.151.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.152.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.152.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.152.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.152.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.153.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.153.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.154.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.154.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.155.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.155.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.155.down_proj.weight": "model-00005-of-000163.safetensors", - 
"model.layers.4.mlp.experts.155.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.156.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.156.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.157.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.157.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.158.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.158.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.159.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", 
"model.layers.4.mlp.experts.159.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.159.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.159.down_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.gate_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.gate_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.up_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.up_proj.weight_scale_inv": "model-00005-of-000163.safetensors", "model.layers.4.mlp.experts.160.down_proj.weight": "model-00005-of-000163.safetensors", - "model.layers.4.mlp.experts.160.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.161.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.161.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.162.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.162.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.162.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.162.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.163.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.163.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.164.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.164.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.165.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.165.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.166.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.166.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.166.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.166.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.167.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.167.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.168.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.168.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.169.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.169.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.169.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.169.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.170.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.170.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.171.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.171.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.172.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.172.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.173.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.173.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.173.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.173.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.174.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.174.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.175.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.175.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.176.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.176.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.176.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.176.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.177.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.177.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.178.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.178.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.179.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.179.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.180.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.180.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.180.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.180.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.181.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.181.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.182.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.182.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.183.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.183.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.183.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.183.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.184.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.184.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.185.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.185.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.186.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.186.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.187.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.187.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.187.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.187.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.188.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.188.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.189.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.189.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.190.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.190.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.190.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.190.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.191.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.191.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.192.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.192.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.193.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.193.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.194.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.194.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.194.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.194.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.195.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.195.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.196.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.196.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.197.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.197.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.197.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.197.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.198.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.198.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.199.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.199.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.200.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.200.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.201.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.201.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.201.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.201.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.202.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.202.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.203.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.203.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.204.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.204.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.204.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.204.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.205.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.205.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.206.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.206.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.207.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.207.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.208.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.208.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.208.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.208.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.209.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.209.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.210.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.210.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.211.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.211.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.211.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.211.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.212.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.212.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.213.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.213.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.214.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.214.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.215.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.215.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.215.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.215.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.216.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.216.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.217.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.217.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.218.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.218.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.218.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.218.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.219.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.219.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.220.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.220.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.221.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.221.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.222.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.222.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.222.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.222.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.223.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.223.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.224.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.224.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.225.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.225.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.225.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.225.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.226.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.226.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.227.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.227.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.228.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.228.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.229.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.229.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.229.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.229.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.230.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.230.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.231.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.231.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.232.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.232.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.232.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.232.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.233.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.233.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.234.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.234.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.235.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.235.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.236.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.236.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.236.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.236.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.237.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.237.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.238.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.238.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.239.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.239.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.239.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.239.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.240.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.240.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.241.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.241.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.242.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.242.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.243.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.243.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.243.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.243.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.244.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.244.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.245.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.245.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.246.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.246.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.246.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.246.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.247.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.247.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.248.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.248.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.249.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.249.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.250.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", 
"model.layers.4.mlp.experts.250.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.250.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.250.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.251.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.251.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.252.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.252.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.253.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.253.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.253.down_proj.weight": "model-00006-of-000163.safetensors", - 
"model.layers.4.mlp.experts.253.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.254.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.254.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.gate_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.gate_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.up_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.up_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.mlp.experts.255.down_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.4.mlp.experts.255.down_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.4.input_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.4.post_attention_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_a_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.q_a_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_a_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.q_b_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.q_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_a_proj_with_mqa.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.kv_a_proj_with_mqa.weight_scale_inv": 
"model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_a_layernorm.weight": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.kv_b_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.kv_b_proj.weight_scale_inv": "model-00006-of-000163.safetensors", "model.layers.5.self_attn.o_proj.weight": "model-00006-of-000163.safetensors", - "model.layers.5.self_attn.o_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.gate.weight": "model-00007-of-000163.safetensors", "model.layers.5.mlp.gate.e_score_correction_bias": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.shared_experts.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.shared_experts.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.0.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.0.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.up_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.1.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.1.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.2.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.2.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.3.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.3.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.4.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.4.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.5.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.5.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.5.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.5.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.6.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.6.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.7.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.7.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.up_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.8.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.8.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.9.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.9.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.10.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.10.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.11.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.11.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.gate_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.12.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.12.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.12.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.12.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.13.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.13.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.14.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.14.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.15.down_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.15.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.16.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.16.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.17.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.17.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.18.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.18.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.19.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.19.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.19.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.19.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.20.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.20.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.21.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.21.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.22.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.22.down_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.23.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.23.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.24.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.24.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.25.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.25.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.26.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.up_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.26.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.26.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.26.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.27.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.27.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.28.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.28.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.29.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.29.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.gate_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.30.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.30.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.31.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.31.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.32.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.32.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.33.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.33.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.33.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.33.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.34.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.34.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.35.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.35.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.36.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.36.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.gate_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.37.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.37.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.38.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.38.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.39.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.39.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.40.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.40.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.40.down_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.40.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.41.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.41.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.42.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.42.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.43.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.43.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.up_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.44.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.44.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.45.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.45.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.46.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.46.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.47.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.47.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.48.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.48.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.48.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.48.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.49.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.49.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.50.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.50.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.up_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.51.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.51.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.52.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.52.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.53.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.53.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.54.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.54.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.gate_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.55.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.55.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.55.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.55.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.56.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.56.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.57.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.57.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.58.down_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.58.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.59.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.59.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.60.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.60.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.61.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.61.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.62.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.62.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.62.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.62.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.63.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.63.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.64.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.64.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.65.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.65.down_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.66.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.66.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.67.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.67.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.68.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.68.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.69.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.up_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.69.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.69.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.69.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.70.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.70.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.71.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.71.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.72.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.72.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.gate_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.73.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.73.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.74.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.74.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.75.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.75.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.76.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.76.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.76.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.76.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.77.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.77.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.78.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.78.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.79.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.79.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.gate_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.80.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.80.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.81.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.81.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.82.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.82.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.83.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.83.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.83.down_proj.weight": "model-00007-of-000163.safetensors", - 
"model.layers.5.mlp.experts.83.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.84.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.84.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.85.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.85.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.86.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.86.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.up_proj.weight": 
"model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.87.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.87.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.88.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.88.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.89.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.89.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.90.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.90.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", 
"model.layers.5.mlp.experts.91.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.91.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.91.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.91.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.92.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.92.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.93.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.93.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.up_proj.weight_scale_inv": 
"model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.94.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.94.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.up_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.95.down_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.95.down_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.96.gate_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.96.gate_proj.weight_scale_inv": "model-00007-of-000163.safetensors", "model.layers.5.mlp.experts.96.up_proj.weight": "model-00007-of-000163.safetensors", - "model.layers.5.mlp.experts.96.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.96.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.96.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.97.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.97.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.98.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.98.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.98.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.98.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.99.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.99.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.100.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.100.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.101.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.101.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.101.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.101.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.102.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.102.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.103.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.103.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.104.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.104.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.105.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.105.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.105.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.105.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.106.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.106.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.107.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.107.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.108.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.108.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.108.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.108.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.109.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.109.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.110.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.110.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.111.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.111.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.112.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.112.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.112.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.112.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.113.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.113.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.114.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.114.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.115.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.115.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.115.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.115.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.116.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.116.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.117.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.117.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.118.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.118.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.119.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.119.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.119.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.119.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.120.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.120.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.121.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.121.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.122.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.122.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.122.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.122.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.123.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.123.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.124.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.124.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.125.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.125.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.126.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.126.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.126.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.126.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.127.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.127.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.128.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.128.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.129.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.129.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.129.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.129.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.130.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.130.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.131.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.131.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.132.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.132.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.133.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.133.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.133.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.133.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.134.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.134.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.135.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.135.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.136.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.136.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.136.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.136.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.137.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.137.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.138.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.138.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.139.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.139.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.140.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.140.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.140.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.140.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.141.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.141.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.142.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.142.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.143.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.143.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.143.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.143.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.144.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.144.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.145.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.145.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.146.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.146.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.147.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.147.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.147.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.147.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.148.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.148.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.149.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.149.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.150.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.150.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.150.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.150.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.151.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.151.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.152.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.152.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.153.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.153.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.154.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.154.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.154.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.154.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.155.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.155.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.156.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.156.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.157.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.157.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.157.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.157.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.158.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.158.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.159.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.159.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.160.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.160.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.161.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.161.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.161.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.161.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.162.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.162.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.163.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.163.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.164.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.164.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.164.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.164.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.165.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.165.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.166.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.166.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.167.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.167.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.168.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.168.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.168.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.168.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.169.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.169.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.170.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.170.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.171.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.171.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.171.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.171.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.172.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.172.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.173.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.173.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.174.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.174.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.175.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.175.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.175.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.175.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.176.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.176.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.177.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.177.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.178.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.178.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.178.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.178.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.179.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.179.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.180.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.180.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.181.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.181.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.182.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.182.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.182.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.182.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.183.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.183.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.184.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.184.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.185.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.185.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.185.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.185.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.186.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.186.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.187.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.187.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.188.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.188.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.gate_proj.weight": "model-00008-of-000163.safetensors", - 
"model.layers.5.mlp.experts.189.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.189.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.189.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.189.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.190.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.190.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.191.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.191.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.192.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.192.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", 
"model.layers.5.mlp.experts.192.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.192.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.gate_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.up_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.up_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.193.down_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.193.down_proj.weight_scale_inv": "model-00008-of-000163.safetensors", "model.layers.5.mlp.experts.194.gate_proj.weight": "model-00008-of-000163.safetensors", - "model.layers.5.mlp.experts.194.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.194.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.194.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.194.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.194.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.195.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.195.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.196.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.196.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.196.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.196.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.197.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.197.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.198.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.198.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.199.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.199.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.199.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.199.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.200.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.200.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.201.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.201.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.202.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.202.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.203.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.203.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.203.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.203.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.204.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.204.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.205.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.205.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.206.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.206.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.206.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.206.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.207.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.207.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.208.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.208.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.209.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.209.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.210.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.210.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.210.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.210.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.211.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.211.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.212.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.212.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.213.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.213.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.213.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.213.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.214.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.214.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.215.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.215.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.216.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.216.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.217.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.217.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.217.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.217.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.218.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.218.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.219.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.219.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.220.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.220.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.220.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.220.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.221.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.221.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.222.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.222.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.223.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.223.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.224.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.224.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.224.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.224.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.225.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.225.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.226.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.226.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.227.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.227.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.227.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.227.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.228.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.228.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.229.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.229.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.230.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.230.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.231.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.231.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.231.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.231.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.232.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.232.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.233.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.233.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.234.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.234.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.234.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.234.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.235.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.235.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.236.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.236.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.237.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.237.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.238.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.238.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.238.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.238.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.239.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.239.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.240.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.240.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.241.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.241.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.241.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.241.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.242.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.242.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.243.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.243.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.244.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.244.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.245.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.245.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.245.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.245.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.246.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.246.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.247.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.247.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.248.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.248.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.248.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.248.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.249.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.249.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.250.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.250.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.251.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.251.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.5.mlp.experts.252.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.252.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.252.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.252.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.253.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.253.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.254.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.254.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.255.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.mlp.experts.255.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.5.mlp.experts.255.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.5.mlp.experts.255.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.5.input_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.5.post_attention_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_a_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.q_a_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_a_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.q_b_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.q_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_a_proj_with_mqa.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_a_layernorm.weight": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.kv_b_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.kv_b_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.self_attn.o_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.self_attn.o_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.gate.weight": "model-00009-of-000163.safetensors", "model.layers.6.mlp.gate.e_score_correction_bias": "model-00009-of-000163.safetensors", "model.layers.6.mlp.shared_experts.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.shared_experts.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.6.mlp.shared_experts.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.shared_experts.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.0.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.0.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.1.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.1.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.2.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.2.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.gate_proj.weight_scale_inv": 
"model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.3.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.3.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.4.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.4.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.5.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.5.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.6.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.6.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.6.down_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.6.mlp.experts.6.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.7.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.7.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.8.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.8.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.9.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.9.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.up_proj.weight": 
"model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.10.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.10.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.11.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.11.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.12.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.12.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.13.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.13.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.6.mlp.experts.14.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.14.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.14.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.14.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.15.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.15.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.16.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.16.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.up_proj.weight_scale_inv": 
"model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.17.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.17.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.18.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.18.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.19.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.19.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.20.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.20.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.gate_proj.weight": "model-00009-of-000163.safetensors", - 
"model.layers.6.mlp.experts.21.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.21.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.21.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.21.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.22.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.22.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.23.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.23.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.24.down_proj.weight": 
"model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.24.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.25.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.25.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.26.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.26.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.27.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.27.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.28.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", 
"model.layers.6.mlp.experts.28.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.28.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.28.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.up_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.29.down_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.29.down_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.30.gate_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.30.gate_proj.weight_scale_inv": "model-00009-of-000163.safetensors", "model.layers.6.mlp.experts.30.up_proj.weight": "model-00009-of-000163.safetensors", - "model.layers.6.mlp.experts.30.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.30.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.30.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.31.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.31.down_proj.weight_scale_inv": 
"model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.32.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.32.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.33.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.33.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.34.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.34.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.35.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.35.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.35.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.35.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.36.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.36.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.37.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.37.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.38.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.38.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.gate_proj.weight": 
"model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.39.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.39.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.40.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.40.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.41.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.41.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.42.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.42.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.42.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.42.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.43.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.43.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.44.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.44.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.45.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.45.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.gate_proj.weight_scale_inv": 
"model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.46.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.46.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.47.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.47.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.48.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.48.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.49.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.49.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.49.down_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.49.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.50.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.50.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.51.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.51.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.52.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.52.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.up_proj.weight": 
"model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.53.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.53.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.54.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.54.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.55.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.55.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.56.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.56.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.57.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.57.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.57.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.57.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.58.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.58.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.59.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.59.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.up_proj.weight_scale_inv": 
"model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.60.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.60.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.61.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.61.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.62.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.62.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.63.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.63.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.gate_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.64.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.64.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.64.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.64.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.65.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.65.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.66.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.66.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.67.down_proj.weight": 
"model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.67.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.68.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.68.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.69.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.69.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.70.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.70.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.71.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.71.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.71.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.71.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.72.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.72.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.73.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.73.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.74.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.74.down_proj.weight_scale_inv": 
"model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.75.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.75.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.76.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.76.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.77.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.77.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.78.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.78.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.78.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.78.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.79.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.79.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.80.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.80.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.81.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.81.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.gate_proj.weight": 
"model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.82.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.82.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.83.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.83.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.84.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.84.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.85.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.85.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.85.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.85.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.86.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.86.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.87.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.87.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.88.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.88.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.gate_proj.weight_scale_inv": 
"model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.89.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.89.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.90.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.90.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.91.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.91.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.92.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.92.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.92.down_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.92.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.93.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.93.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.94.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.94.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.95.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.95.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.up_proj.weight": 
"model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.96.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.96.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.97.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.97.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.98.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.98.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.99.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.99.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.100.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.100.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.100.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.100.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.101.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.101.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.102.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.102.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.103.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.103.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.103.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.103.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.104.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.104.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.105.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.105.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.106.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.106.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.107.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.107.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.107.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.107.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.108.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.108.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.109.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.109.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.110.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.110.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.110.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.110.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.111.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.111.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.112.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.112.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.113.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.113.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.114.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.114.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.114.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.114.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.115.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.115.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.116.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.116.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.117.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.117.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.117.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.117.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.118.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.118.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.119.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.119.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.120.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.120.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.121.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.121.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.121.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.121.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.122.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.122.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.123.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.123.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.124.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.up_proj.weight": "model-00010-of-000163.safetensors", - 
"model.layers.6.mlp.experts.124.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.124.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.124.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.125.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.125.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.126.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.126.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.gate_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.up_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.up_proj.weight_scale_inv": "model-00010-of-000163.safetensors", "model.layers.6.mlp.experts.127.down_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.127.down_proj.weight_scale_inv": "model-00010-of-000163.safetensors", 
"model.layers.6.mlp.experts.128.gate_proj.weight": "model-00010-of-000163.safetensors", - "model.layers.6.mlp.experts.128.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.128.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.128.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.128.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.128.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.129.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.129.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.130.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.130.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.131.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.131.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.131.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.131.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.132.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.132.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.133.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.133.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.134.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.134.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.135.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.135.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.135.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.135.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.136.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.136.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.137.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.137.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.138.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.138.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.138.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.138.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.139.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.139.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.140.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.140.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.141.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.141.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.142.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.142.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.142.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.142.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.143.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.143.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.144.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.144.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.145.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.145.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.145.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.145.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.146.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.146.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.147.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.147.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.148.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.148.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.149.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.149.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.149.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.149.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.150.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.150.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.151.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.151.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.152.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.152.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.152.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.152.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.153.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.153.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.154.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.154.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.155.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.155.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.156.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.156.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.156.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.156.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.157.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.157.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.158.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.158.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.159.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.159.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.159.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.159.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.160.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.160.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.161.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.161.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.162.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.162.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.163.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.163.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.163.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.163.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.164.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.164.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.165.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.165.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.166.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.166.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.166.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.166.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.167.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.167.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.168.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.168.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.169.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.169.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.170.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.170.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.170.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.170.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.171.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.171.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.172.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.172.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.173.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.173.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.173.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.173.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.174.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.174.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.175.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.175.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.176.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.176.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.177.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.177.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.177.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.177.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.178.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.178.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.179.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.179.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.180.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.180.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.180.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.180.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.181.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.181.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.182.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.182.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.183.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.183.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.184.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.184.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.184.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.184.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.185.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.185.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.186.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.186.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.187.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.187.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.187.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.187.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.188.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.188.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.189.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.189.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.190.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.190.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.191.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.191.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.191.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.191.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.192.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.192.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.193.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.193.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.194.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.194.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.194.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.194.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.195.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.195.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.196.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.196.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.197.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.197.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.198.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.198.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.198.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.198.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.199.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.199.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.200.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.200.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.201.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.201.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.201.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.201.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.202.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.202.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.203.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.203.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.204.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.204.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.205.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.205.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.205.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.205.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.206.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.206.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.207.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.207.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.208.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.208.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.208.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.208.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.209.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.209.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.210.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.210.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.211.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.211.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.212.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.212.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.212.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.212.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.213.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.213.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.214.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.214.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.215.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.215.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.215.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.215.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.216.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.216.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.217.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.217.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.218.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.218.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", 
"model.layers.6.mlp.experts.219.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.219.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.219.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.219.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.220.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.220.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.221.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.221.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.222.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.up_proj.weight": "model-00011-of-000163.safetensors", - 
"model.layers.6.mlp.experts.222.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.222.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.222.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.223.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.223.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.224.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.224.down_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.gate_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.gate_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.up_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.up_proj.weight_scale_inv": "model-00011-of-000163.safetensors", "model.layers.6.mlp.experts.225.down_proj.weight": "model-00011-of-000163.safetensors", - "model.layers.6.mlp.experts.225.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", 
"model.layers.6.mlp.experts.226.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.226.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.226.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.226.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.227.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.227.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.228.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.228.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.229.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.up_proj.weight": "model-00012-of-000163.safetensors", - 
"model.layers.6.mlp.experts.229.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.229.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.229.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.230.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.230.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.231.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.231.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.232.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.232.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", 
"model.layers.6.mlp.experts.233.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.233.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.233.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.233.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.234.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.234.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.235.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.235.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.236.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.up_proj.weight": "model-00012-of-000163.safetensors", - 
"model.layers.6.mlp.experts.236.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.236.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.236.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.237.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.237.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.238.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.238.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.239.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.239.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", 
"model.layers.6.mlp.experts.240.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.240.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.240.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.240.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.241.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.241.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.242.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.242.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.243.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.up_proj.weight": "model-00012-of-000163.safetensors", - 
"model.layers.6.mlp.experts.243.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.243.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.243.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.244.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.244.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.245.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.245.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.246.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.246.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", 
"model.layers.6.mlp.experts.247.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.247.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.247.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.247.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.248.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.248.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.249.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.249.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.250.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.up_proj.weight": "model-00012-of-000163.safetensors", - 
"model.layers.6.mlp.experts.250.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.250.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.250.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.251.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.251.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.252.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.252.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.253.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.253.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", 
"model.layers.6.mlp.experts.254.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.254.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.254.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.254.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.gate_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.gate_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.up_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.up_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.mlp.experts.255.down_proj.weight": "model-00012-of-000163.safetensors", - "model.layers.6.mlp.experts.255.down_proj.weight_scale_inv": "model-00012-of-000163.safetensors", "model.layers.6.input_layernorm.weight": "model-00012-of-000163.safetensors", "model.layers.6.post_attention_layernorm.weight": "model-00012-of-000163.safetensors", "model.layers.7.self_attn.q_a_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.q_a_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.q_a_layernorm.weight": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.q_b_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.q_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.kv_a_proj_with_mqa.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.kv_a_layernorm.weight": "model-00013-of-000163.safetensors", 
"model.layers.7.self_attn.kv_b_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.kv_b_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.self_attn.o_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.self_attn.o_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.gate.weight": "model-00013-of-000163.safetensors", "model.layers.7.mlp.gate.e_score_correction_bias": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.shared_experts.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.shared_experts.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.0.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.0.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.1.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.1.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.1.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.1.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.2.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.2.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.3.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.3.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.4.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.4.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.gate_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.5.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.5.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.6.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.6.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.7.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.7.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.8.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.8.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.8.down_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.8.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.9.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.9.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.10.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.10.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.11.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.11.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.up_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.12.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.12.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.13.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.13.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.14.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.14.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.15.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.15.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.16.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.16.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.16.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.16.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.17.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.17.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.18.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.18.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.up_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.19.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.19.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.20.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.20.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.21.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.21.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.22.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.22.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.gate_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.23.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.23.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.23.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.23.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.24.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.24.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.25.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.25.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.26.down_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.26.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.27.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.27.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.28.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.28.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.29.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.29.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.30.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.30.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.30.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.30.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.31.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.31.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.32.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.32.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.33.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.33.down_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.34.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.34.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.35.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.35.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.36.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.36.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.37.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.up_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.37.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.37.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.37.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.38.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.38.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.39.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.39.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.40.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.40.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.gate_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.41.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.41.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.42.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.42.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.43.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.43.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.44.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.44.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.44.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.44.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.45.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.45.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.46.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.46.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.47.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.47.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.gate_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.48.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.48.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.49.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.49.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.50.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.50.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.51.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.51.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.51.down_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.51.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.52.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.52.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.53.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.53.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.54.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.54.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.up_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.55.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.55.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.56.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.56.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.57.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.57.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.58.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.58.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.59.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.59.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.59.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.59.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.60.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.60.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.61.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.61.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.up_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.62.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.62.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.63.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.63.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.64.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.64.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.65.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.65.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.gate_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.66.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.66.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.66.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.66.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.67.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.67.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.68.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.68.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.69.down_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.69.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.70.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.70.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.71.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.71.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.72.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.72.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.73.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.73.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.73.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.73.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.74.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.74.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.75.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.75.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.76.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.76.down_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.77.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.77.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.78.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.78.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.79.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.79.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.80.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.up_proj.weight": "model-00013-of-000163.safetensors", - 
"model.layers.7.mlp.experts.80.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.80.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.80.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.81.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.81.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.82.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.82.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.83.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.83.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.gate_proj.weight": 
"model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.84.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.84.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.85.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.85.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.86.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.86.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.87.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.87.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", 
"model.layers.7.mlp.experts.87.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.87.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.88.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.88.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.89.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.89.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.gate_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.90.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.90.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.gate_proj.weight_scale_inv": 
"model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.up_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.up_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.91.down_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.91.down_proj.weight_scale_inv": "model-00013-of-000163.safetensors", "model.layers.7.mlp.experts.92.gate_proj.weight": "model-00013-of-000163.safetensors", - "model.layers.7.mlp.experts.92.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.92.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.92.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.92.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.92.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.93.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.93.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.94.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.94.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.94.down_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.94.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.95.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.95.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.96.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.96.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.97.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.97.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.up_proj.weight": 
"model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.98.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.98.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.99.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.99.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.100.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.100.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.101.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.101.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.102.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.102.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.102.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.102.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.103.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.103.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.104.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.104.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.105.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.105.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.105.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.105.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.106.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.106.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.107.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.107.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.108.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.108.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.109.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.109.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.109.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.109.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.110.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.110.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.111.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.111.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.112.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.112.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.112.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.112.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.113.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.113.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.114.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.114.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.115.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.115.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.116.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.116.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.116.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.116.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.117.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.117.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.118.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.118.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.119.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.119.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.119.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.119.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.120.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.120.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.121.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.121.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.122.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.122.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.123.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.123.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.123.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.123.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.124.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.124.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.125.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.125.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.126.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.126.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.126.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.126.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.127.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.127.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.128.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.128.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.129.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.129.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.130.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.130.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.130.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.130.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.131.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.131.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.132.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.132.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.133.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.133.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.133.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.133.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.134.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.134.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.135.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.135.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.136.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.136.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.137.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.137.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.137.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.137.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.138.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.138.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.139.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.139.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.140.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.140.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.140.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.140.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.141.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.141.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.142.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.142.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.143.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.143.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.144.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.144.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.144.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.144.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.145.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.145.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.146.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.146.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.147.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.147.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.147.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.147.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.148.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.148.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.149.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.149.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.150.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.150.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.151.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.151.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.151.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.151.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.152.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.152.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.153.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.153.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.154.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.154.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.154.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.154.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.155.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.155.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.156.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.156.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.157.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.157.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.158.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.158.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.158.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.158.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.159.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.159.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.160.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.160.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.161.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.161.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.161.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.161.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.162.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.162.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.163.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.163.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.164.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.164.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.165.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.165.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.165.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.165.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.166.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.166.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.167.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.167.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.168.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.168.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.168.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.168.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.169.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.169.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.170.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.170.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.171.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.171.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.172.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.172.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.172.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.172.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.173.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.173.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.174.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.174.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.175.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.175.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.175.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.175.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.176.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.176.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.177.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.177.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.178.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.178.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.179.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.179.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.179.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.179.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.180.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.180.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.181.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.181.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.182.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.182.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.182.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.182.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.183.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.183.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.184.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.184.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.185.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.185.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", 
"model.layers.7.mlp.experts.186.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.186.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.186.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.186.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.187.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.187.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.up_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.188.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.188.down_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.gate_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.189.gate_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.up_proj.weight": "model-00014-of-000163.safetensors", - 
"model.layers.7.mlp.experts.189.up_proj.weight_scale_inv": "model-00014-of-000163.safetensors", "model.layers.7.mlp.experts.189.down_proj.weight": "model-00014-of-000163.safetensors", - "model.layers.7.mlp.experts.189.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.190.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.190.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.191.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.191.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.192.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.192.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.193.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.193.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.193.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.193.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.194.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.194.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.195.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.195.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.196.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.196.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.196.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.196.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.197.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.197.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.198.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.198.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.199.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.199.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.200.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.200.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.200.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.200.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.201.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.201.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.202.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.202.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.203.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.203.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.203.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.203.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.204.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.204.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.205.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.205.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.206.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.206.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.207.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.207.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.207.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.207.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.208.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.208.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.209.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.209.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.210.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.210.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.210.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.210.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.211.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.211.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.212.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.212.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.213.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.213.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.214.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.214.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.214.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.214.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.215.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.215.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.216.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.216.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.217.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.217.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.217.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.217.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.218.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.218.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.219.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.219.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.220.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.220.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.221.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.221.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.221.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.221.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.222.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.222.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.223.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.223.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.224.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.224.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.224.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.224.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.225.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.225.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.226.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.226.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.227.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.227.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.228.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.228.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.228.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.228.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.229.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.229.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.230.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.230.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.231.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.231.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.231.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.231.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.232.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.232.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.233.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.233.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.234.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.234.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.235.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.235.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.235.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.235.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.236.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.236.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.237.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.237.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.238.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.238.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.238.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.238.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.239.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.239.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.240.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.240.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.241.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.241.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.242.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.242.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.242.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.242.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.243.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.243.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.244.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.244.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.245.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.245.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.245.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.245.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.246.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.246.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.247.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.247.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.248.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.248.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.mlp.experts.249.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.249.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.249.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.249.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.250.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.250.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.251.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.251.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.252.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.7.mlp.experts.252.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.252.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.252.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.253.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.253.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.254.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.254.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.7.mlp.experts.255.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.7.mlp.experts.255.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.7.input_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.7.post_attention_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_a_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.q_a_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_a_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.q_b_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.q_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_a_proj_with_mqa.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_a_layernorm.weight": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.kv_b_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.kv_b_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.self_attn.o_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.self_attn.o_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.gate.weight": "model-00015-of-000163.safetensors", "model.layers.8.mlp.gate.e_score_correction_bias": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.shared_experts.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.shared_experts.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.8.mlp.experts.0.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.0.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.0.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.0.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.1.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.1.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.2.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.2.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.3.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.3.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.4.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.4.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.5.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.5.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.6.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.6.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.gate_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.8.mlp.experts.7.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.7.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.7.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.7.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.8.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.8.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.9.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.9.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.10.down_proj.weight": 
"model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.10.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.11.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.11.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.12.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.12.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.13.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.13.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.14.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", 
"model.layers.8.mlp.experts.14.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.14.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.14.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.15.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.15.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.16.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.16.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.17.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.17.down_proj.weight_scale_inv": 
"model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.18.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.18.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.19.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.19.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.20.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.20.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.21.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.up_proj.weight": "model-00015-of-000163.safetensors", - 
"model.layers.8.mlp.experts.21.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.21.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.21.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.22.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.22.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.23.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.23.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.24.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.24.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.gate_proj.weight": 
"model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.gate_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.up_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.up_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.25.down_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.25.down_proj.weight_scale_inv": "model-00015-of-000163.safetensors", "model.layers.8.mlp.experts.26.gate_proj.weight": "model-00015-of-000163.safetensors", - "model.layers.8.mlp.experts.26.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.26.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.26.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.26.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.26.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.27.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.27.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.28.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.28.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.28.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.28.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.29.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.29.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.30.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.30.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.31.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.31.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.gate_proj.weight_scale_inv": 
"model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.32.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.32.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.33.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.33.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.34.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.34.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.35.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.35.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.35.down_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.35.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.36.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.36.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.37.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.37.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.38.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.38.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.up_proj.weight": 
"model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.39.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.39.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.40.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.40.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.41.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.41.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.42.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.42.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.43.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.43.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.43.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.43.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.44.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.44.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.45.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.45.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.up_proj.weight_scale_inv": 
"model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.46.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.46.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.47.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.47.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.48.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.48.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.49.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.49.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.gate_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.50.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.50.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.50.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.50.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.51.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.51.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.52.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.52.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.53.down_proj.weight": 
"model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.53.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.54.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.54.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.55.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.55.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.56.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.56.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.57.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.57.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.57.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.57.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.58.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.58.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.59.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.59.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.60.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.60.down_proj.weight_scale_inv": 
"model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.61.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.61.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.62.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.62.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.63.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.63.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.64.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.up_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.64.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.64.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.64.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.65.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.65.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.66.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.66.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.67.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.67.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.gate_proj.weight": 
"model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.68.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.68.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.69.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.69.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.70.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.70.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.71.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.71.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.71.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.71.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.72.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.72.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.73.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.73.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.74.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.74.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.gate_proj.weight_scale_inv": 
"model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.75.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.75.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.76.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.76.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.77.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.77.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.78.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.78.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.78.down_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.78.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.79.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.79.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.80.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.80.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.81.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.81.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.up_proj.weight": 
"model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.82.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.82.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.83.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.83.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.84.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.84.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.85.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.85.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.86.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.86.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.86.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.86.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.87.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.87.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.88.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.88.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.up_proj.weight_scale_inv": 
"model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.89.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.89.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.90.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.90.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.91.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.91.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.92.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.92.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.gate_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.93.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.93.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.93.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.93.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.94.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.94.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.95.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.95.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.96.down_proj.weight": 
"model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.96.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.97.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.97.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.98.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.98.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.99.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.99.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.100.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.100.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.100.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.100.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.101.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.101.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.102.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.102.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.103.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.103.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.103.down_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.103.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.104.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.104.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.105.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.105.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.106.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.106.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.107.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.107.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.107.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.107.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.108.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.108.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.109.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.109.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.110.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.110.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.110.down_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.110.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.111.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.111.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.112.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.112.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.113.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.113.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.114.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.114.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.114.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.114.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.115.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.115.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.116.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.116.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.117.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.117.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.117.down_proj.weight": "model-00016-of-000163.safetensors", - 
"model.layers.8.mlp.experts.117.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.118.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.118.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.119.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.119.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.120.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.120.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.121.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", 
"model.layers.8.mlp.experts.121.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.121.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.121.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.122.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.122.down_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.gate_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.gate_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.up_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.up_proj.weight_scale_inv": "model-00016-of-000163.safetensors", "model.layers.8.mlp.experts.123.down_proj.weight": "model-00016-of-000163.safetensors", - "model.layers.8.mlp.experts.123.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.124.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.124.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.124.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.124.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.125.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.125.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.126.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.126.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.127.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.127.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.128.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.128.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.128.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.128.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.129.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.129.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.130.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.130.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.131.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.131.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.131.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.131.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.132.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.132.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.133.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.133.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.134.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.134.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.135.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.135.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.135.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.135.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.136.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.136.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.137.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.137.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.138.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.138.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.138.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.138.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.139.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.139.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.140.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.140.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.141.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.141.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.142.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.142.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.142.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.142.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.143.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.143.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.144.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.144.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.145.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.145.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.145.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.145.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.146.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.146.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.147.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.147.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.148.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.148.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.149.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.149.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.149.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.149.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.150.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.150.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.151.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.151.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.152.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.152.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.152.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.152.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.153.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.153.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.154.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.154.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.155.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.155.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.156.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.156.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.156.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.156.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.157.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.157.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.158.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.158.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.159.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.159.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.159.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.159.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.160.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.160.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.161.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.161.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.162.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.162.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.163.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.163.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.163.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.163.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.164.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.164.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.165.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.165.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.166.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.166.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.166.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.166.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.167.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.167.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.168.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.168.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.169.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.169.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.170.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.170.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.170.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.170.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.171.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.171.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.172.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.172.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.173.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.173.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.173.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.173.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.174.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.174.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.175.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.175.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.176.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.176.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.177.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.177.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.177.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.177.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.178.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.178.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.179.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.179.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.180.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.180.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.180.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.180.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.181.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.181.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.182.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.182.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.183.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.183.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.184.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.184.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.184.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.184.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.185.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.185.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.186.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.186.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.187.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.187.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.187.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.187.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.188.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.188.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.189.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.189.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.190.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.190.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.191.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.191.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.191.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.191.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.192.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.192.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.193.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.193.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.194.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.194.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.194.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.194.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.195.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.195.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.196.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.196.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.197.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.197.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.198.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.198.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.198.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.198.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.199.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.199.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.200.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.200.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.201.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.201.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.201.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.201.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.202.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.202.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.203.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.203.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.204.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.204.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.205.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.205.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.205.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.205.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.206.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.206.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.207.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.207.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.208.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.208.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.208.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.208.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.209.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.209.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.210.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.210.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.211.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.211.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.212.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.212.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.212.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.212.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.213.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.213.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.214.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.214.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.215.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.215.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.215.down_proj.weight": "model-00017-of-000163.safetensors", - 
"model.layers.8.mlp.experts.215.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.216.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.216.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.217.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.217.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.218.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.218.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.219.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", 
"model.layers.8.mlp.experts.219.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.219.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.219.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.up_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.220.down_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.220.down_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.221.gate_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.221.gate_proj.weight_scale_inv": "model-00017-of-000163.safetensors", "model.layers.8.mlp.experts.221.up_proj.weight": "model-00017-of-000163.safetensors", - "model.layers.8.mlp.experts.221.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.221.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.221.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.222.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.222.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.222.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.8.mlp.experts.222.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.223.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.223.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.224.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.224.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.225.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.225.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.226.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.8.mlp.experts.226.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.226.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.226.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.227.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.227.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.228.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.228.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.229.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.229.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.229.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.8.mlp.experts.229.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.230.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.230.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.231.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.231.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.232.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.232.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.233.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.8.mlp.experts.233.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.233.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.233.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.234.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.234.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.235.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.235.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.236.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.236.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.236.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.8.mlp.experts.236.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.237.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.237.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.238.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.238.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.239.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.239.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.240.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.8.mlp.experts.240.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.240.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.240.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.241.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.241.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.242.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.242.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.243.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.243.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.243.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.8.mlp.experts.243.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.244.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.244.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.245.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.245.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.246.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.246.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.247.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.8.mlp.experts.247.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.247.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.247.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.248.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.248.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.249.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.249.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.250.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.250.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.250.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.8.mlp.experts.250.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.251.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.251.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.252.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.252.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.253.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.253.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.254.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.8.mlp.experts.254.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.254.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.254.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.mlp.experts.255.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.8.mlp.experts.255.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.8.input_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.8.post_attention_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_a_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.q_a_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_a_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.q_b_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.q_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_a_proj_with_mqa.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_a_layernorm.weight": "model-00018-of-000163.safetensors", "model.layers.9.self_attn.kv_b_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.kv_b_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.9.self_attn.o_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.self_attn.o_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.gate.weight": "model-00018-of-000163.safetensors", "model.layers.9.mlp.gate.e_score_correction_bias": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.shared_experts.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.shared_experts.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.0.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.0.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.1.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.1.down_proj.weight_scale_inv": 
"model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.2.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.2.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.3.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.3.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.4.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.4.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.5.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.up_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.9.mlp.experts.5.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.5.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.5.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.6.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.6.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.7.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.7.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.8.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.8.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.gate_proj.weight": 
"model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.9.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.9.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.10.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.10.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.11.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.11.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.12.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.12.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.9.mlp.experts.12.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.12.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.13.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.13.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.14.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.14.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.15.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.15.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.gate_proj.weight_scale_inv": 
"model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.16.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.16.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.17.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.17.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.18.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.18.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.19.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.19.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.19.down_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.9.mlp.experts.19.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.20.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.20.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.21.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.21.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.22.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.22.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.up_proj.weight": 
"model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.23.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.23.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.24.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.24.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.25.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.25.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.26.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.26.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.9.mlp.experts.27.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.27.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.27.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.27.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.28.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.28.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.29.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.29.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.up_proj.weight_scale_inv": 
"model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.30.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.30.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.31.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.31.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.32.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.32.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.33.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.33.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.gate_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.9.mlp.experts.34.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.34.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.34.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.34.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.35.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.35.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.36.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.36.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.37.down_proj.weight": 
"model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.37.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.38.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.38.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.39.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.39.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.40.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.40.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.41.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.9.mlp.experts.41.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.41.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.41.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.42.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.42.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.43.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.43.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.44.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.44.down_proj.weight_scale_inv": 
"model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.45.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.45.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.46.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.46.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.47.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.47.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.48.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.up_proj.weight": "model-00018-of-000163.safetensors", - 
"model.layers.9.mlp.experts.48.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.48.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.48.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.49.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.49.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.50.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.50.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.51.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.51.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.gate_proj.weight": 
"model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.52.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.52.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.53.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.53.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.54.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.54.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.55.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.55.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", 
"model.layers.9.mlp.experts.55.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.55.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.56.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.56.down_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.gate_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.gate_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.up_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.up_proj.weight_scale_inv": "model-00018-of-000163.safetensors", "model.layers.9.mlp.experts.57.down_proj.weight": "model-00018-of-000163.safetensors", - "model.layers.9.mlp.experts.57.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.58.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.58.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.gate_proj.weight_scale_inv": 
"model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.59.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.59.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.60.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.60.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.61.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.61.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.62.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.62.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.62.down_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.62.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.63.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.63.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.64.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.64.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.65.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.65.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.up_proj.weight": 
"model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.66.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.66.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.67.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.67.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.68.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.68.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.69.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.69.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.70.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.70.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.70.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.70.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.71.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.71.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.72.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.72.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.up_proj.weight_scale_inv": 
"model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.73.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.73.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.74.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.74.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.75.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.75.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.76.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.76.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.77.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.77.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.77.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.77.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.78.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.78.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.79.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.79.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.80.down_proj.weight": 
"model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.80.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.81.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.81.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.82.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.82.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.83.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.83.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.84.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.84.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.84.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.84.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.85.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.85.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.86.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.86.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.87.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.87.down_proj.weight_scale_inv": 
"model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.88.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.88.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.89.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.89.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.90.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.90.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.91.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.up_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.91.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.91.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.91.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.92.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.92.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.93.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.93.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.94.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.94.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.gate_proj.weight": 
"model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.95.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.95.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.96.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.96.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.97.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.97.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.98.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.98.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.98.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.98.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.99.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.99.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.100.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.100.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.101.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.101.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.102.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.102.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.102.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.102.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.103.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.103.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.104.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.104.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.105.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.105.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.105.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.105.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.106.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.106.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.107.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.107.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.108.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.108.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.109.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.109.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.109.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.109.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.110.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.110.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.111.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.111.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.112.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.112.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.112.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.112.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.113.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.113.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.114.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.114.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.115.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.115.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.116.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.116.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.116.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.116.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.117.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.117.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.118.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.118.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.119.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.119.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.119.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.119.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.120.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.120.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.121.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.121.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.122.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.122.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.123.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.123.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.123.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.123.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.124.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.124.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.125.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.125.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.126.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.126.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.126.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.126.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.127.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.127.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.128.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.128.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.129.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.129.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.130.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.130.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.130.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.130.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.131.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.131.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.132.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.132.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.133.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.133.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.133.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.133.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.134.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.134.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.135.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.135.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.136.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.136.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.137.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.137.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.137.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.137.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.138.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.138.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.139.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.139.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.140.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.140.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.140.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.140.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.141.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.141.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.142.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.142.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.143.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.143.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.144.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.144.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.144.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.144.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.145.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.145.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.146.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.146.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.147.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.147.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.147.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.147.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.148.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.148.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.149.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.149.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.150.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.150.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.gate_proj.weight": "model-00019-of-000163.safetensors", - 
"model.layers.9.mlp.experts.151.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.151.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.151.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.151.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.152.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.152.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.153.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.153.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.154.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.154.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.up_proj.weight_scale_inv": "model-00019-of-000163.safetensors", 
"model.layers.9.mlp.experts.154.down_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.154.down_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.155.gate_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.155.gate_proj.weight_scale_inv": "model-00019-of-000163.safetensors", "model.layers.9.mlp.experts.155.up_proj.weight": "model-00019-of-000163.safetensors", - "model.layers.9.mlp.experts.155.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.155.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.155.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.156.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.156.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.157.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.157.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.158.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.158.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.158.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.158.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.159.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.159.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.160.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.160.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.161.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.161.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.161.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.161.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.162.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.162.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.163.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.163.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.164.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.164.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.165.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.165.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.165.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.165.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.166.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.166.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.167.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.167.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.168.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.168.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.168.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.168.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.169.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.169.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.170.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.170.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.171.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.171.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.172.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.172.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.172.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.172.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.173.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.173.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.174.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.174.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.175.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.175.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.175.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.175.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.176.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.176.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.177.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.177.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.178.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.178.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.179.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.179.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.179.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.179.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.180.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.180.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.181.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.181.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.182.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.182.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.182.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.182.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.183.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.183.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.184.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.184.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.185.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.185.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.186.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.186.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.186.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.186.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.187.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.187.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.188.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.188.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.189.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.189.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.189.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.189.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.190.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.190.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.191.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.191.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.192.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.192.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.193.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.193.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.193.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.193.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.194.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.194.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.195.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.195.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.196.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.196.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.196.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.196.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.197.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.197.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.198.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.198.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.199.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.199.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.200.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.200.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.200.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.200.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.201.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.201.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.202.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.202.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.203.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.203.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.203.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.203.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.204.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.204.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.205.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.205.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.206.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.206.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.207.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.207.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.207.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.207.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.208.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.208.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.209.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.209.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.210.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.210.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.210.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.210.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.211.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.211.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.212.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.212.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.213.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.213.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.214.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.214.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.214.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.214.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.215.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.215.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.216.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.216.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.217.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.217.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.217.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.217.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.218.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.218.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.219.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.219.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.220.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.220.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.221.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.221.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.221.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.221.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.222.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.222.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.223.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.223.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.224.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.224.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.224.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.224.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.225.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.225.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.226.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.226.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.227.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.227.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.228.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.228.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.228.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.228.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.229.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.229.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.230.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.230.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.231.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.231.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.231.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.231.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.232.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.232.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.233.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.233.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.234.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.234.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.235.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.235.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.235.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.235.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.236.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.236.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.237.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.237.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.238.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.238.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.238.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.238.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.239.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.239.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.240.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.240.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.241.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.241.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.242.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.242.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.242.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.242.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.243.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.243.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.244.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.244.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.245.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.245.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.245.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.245.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.246.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.246.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.247.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.247.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.248.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.248.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.gate_proj.weight": "model-00020-of-000163.safetensors", - 
"model.layers.9.mlp.experts.249.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.249.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.249.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.249.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.250.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.250.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.251.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.251.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.252.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.gate_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.252.up_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.up_proj.weight_scale_inv": "model-00020-of-000163.safetensors", 
"model.layers.9.mlp.experts.252.down_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.252.down_proj.weight_scale_inv": "model-00020-of-000163.safetensors", "model.layers.9.mlp.experts.253.gate_proj.weight": "model-00020-of-000163.safetensors", - "model.layers.9.mlp.experts.253.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.253.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.253.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.253.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.253.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.254.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.254.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.mlp.experts.255.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.9.mlp.experts.255.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.9.input_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.9.post_attention_layernorm.weight": 
"model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_a_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.q_a_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_a_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.q_b_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.q_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_a_proj_with_mqa.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_a_layernorm.weight": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.kv_b_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.kv_b_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.self_attn.o_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.self_attn.o_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.gate.weight": "model-00021-of-000163.safetensors", "model.layers.10.mlp.gate.e_score_correction_bias": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.shared_experts.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.shared_experts.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.gate_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.0.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.0.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.0.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.0.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.1.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.1.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.2.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.2.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.3.down_proj.weight": 
"model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.3.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.4.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.4.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.5.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.5.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.6.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.6.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.7.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.7.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.7.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.7.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.8.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.8.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.9.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.9.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.10.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.11.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.11.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.12.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.12.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.13.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.13.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.14.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.14.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.14.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.14.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.15.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.15.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.16.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.16.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.17.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.17.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.18.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.18.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.18.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.18.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.19.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.19.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.20.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.20.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.21.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.21.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.21.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.21.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.22.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.22.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.23.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.23.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.24.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.24.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.25.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.25.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.25.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.25.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.26.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.26.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.27.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.27.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.28.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.28.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.28.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.28.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.29.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.29.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.30.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.30.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.31.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.31.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.32.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.32.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.32.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.32.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.33.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.33.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.34.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.34.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.35.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.35.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.35.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.35.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.36.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.36.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.37.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.37.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.38.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.38.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.39.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.39.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.39.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.39.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.40.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.40.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.41.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.41.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.42.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.42.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.42.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.42.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.43.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.43.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.44.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.44.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.45.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.45.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.46.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.46.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.46.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.46.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.47.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.47.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.48.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.48.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.49.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.49.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.49.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.49.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.50.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.50.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.51.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.51.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.52.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.52.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.53.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.53.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.53.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.53.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.54.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.54.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.55.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.55.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.56.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.56.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.56.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.56.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.57.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.57.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.58.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.58.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.59.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.59.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.60.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.60.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.60.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.60.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.61.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.61.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.62.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.62.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.63.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.63.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.63.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.63.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.64.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.64.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.65.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.65.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.66.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.66.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.67.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.67.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.67.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.67.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.68.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.68.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.69.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.69.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.70.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.70.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.70.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.70.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.71.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.71.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.72.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.72.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.73.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.73.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.74.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.74.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.74.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.74.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.75.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.75.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.76.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.76.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.77.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.77.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.77.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.77.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.78.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.78.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.79.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.79.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.80.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.80.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.81.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.81.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.81.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.81.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.82.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.82.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.83.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.83.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.84.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.up_proj.weight": "model-00021-of-000163.safetensors", - 
"model.layers.10.mlp.experts.84.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.84.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.84.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.85.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.85.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.86.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.86.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.87.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.87.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", 
"model.layers.10.mlp.experts.88.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.88.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.up_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.88.down_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.88.down_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.89.gate_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.89.gate_proj.weight_scale_inv": "model-00021-of-000163.safetensors", "model.layers.10.mlp.experts.89.up_proj.weight": "model-00021-of-000163.safetensors", - "model.layers.10.mlp.experts.89.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.89.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.89.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.90.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.90.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.91.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.91.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.91.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.91.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.92.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.92.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.93.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.93.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.94.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.94.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.95.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.95.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.95.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.95.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.96.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.96.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.97.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.97.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.98.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.98.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.98.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.98.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.99.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.99.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.100.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.100.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.101.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.101.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.102.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.102.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.102.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.102.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.103.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.103.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.104.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.104.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.105.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.105.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.105.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.105.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.106.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.106.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.107.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.107.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.108.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.108.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.109.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.109.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.109.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.109.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.110.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.110.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.111.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.111.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.112.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.112.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.112.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.112.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.113.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.113.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.114.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.114.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.115.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.115.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.116.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.116.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.116.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.116.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.117.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.117.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.118.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.118.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.119.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.119.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.119.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.119.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.120.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.120.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.121.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.121.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.122.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.122.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.123.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.123.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.123.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.123.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.124.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.124.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.125.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.125.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.126.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.126.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.126.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.126.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.127.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.127.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.128.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.128.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.129.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.129.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.130.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.130.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.130.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.130.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.131.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.131.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.132.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.132.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.133.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.133.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.133.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.133.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.134.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.134.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.135.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.135.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.136.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.136.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.137.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.137.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.137.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.137.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.138.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.138.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.139.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.139.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.140.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.140.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.140.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.140.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.141.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.141.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.142.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.142.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.143.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.143.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.144.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.144.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.144.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.144.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.145.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.145.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.146.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.146.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.147.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.147.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.147.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.147.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.148.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.148.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.149.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.149.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.150.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.150.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.151.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.151.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.151.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.151.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.152.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.152.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.153.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.153.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.154.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.154.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.154.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.154.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.155.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.155.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.156.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.156.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.157.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.157.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.158.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.158.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.158.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.158.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.159.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.159.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.160.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.160.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.161.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.161.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.161.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.161.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.162.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.162.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.163.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.163.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.164.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.164.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.165.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.165.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.165.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.165.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.166.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.166.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.167.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.167.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.168.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.168.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.168.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.168.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.169.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.169.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.170.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.170.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.171.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.171.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.172.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.172.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.172.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.172.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.173.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.173.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.174.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.174.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.175.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.175.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.175.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.175.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.176.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.176.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.177.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.177.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.178.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.178.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.179.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.179.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.179.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.179.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.180.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.180.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.181.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.181.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.182.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.up_proj.weight": "model-00022-of-000163.safetensors", - 
"model.layers.10.mlp.experts.182.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.182.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.182.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.183.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.183.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.184.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.184.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.185.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.185.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", 
"model.layers.10.mlp.experts.186.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.gate_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.186.up_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.up_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.186.down_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.186.down_proj.weight_scale_inv": "model-00022-of-000163.safetensors", "model.layers.10.mlp.experts.187.gate_proj.weight": "model-00022-of-000163.safetensors", - "model.layers.10.mlp.experts.187.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.187.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.187.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.187.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.187.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.188.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.188.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.189.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.189.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.189.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.189.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.190.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.190.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.191.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.191.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.192.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.192.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.193.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.193.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.193.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.193.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.194.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.194.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.195.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.195.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.196.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.196.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.196.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.196.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.197.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.197.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.198.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.198.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.199.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.199.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.200.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.200.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.200.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.200.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.201.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.201.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.202.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.202.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.203.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.203.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.203.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.203.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.204.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.204.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.205.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.205.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.206.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.206.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.207.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.207.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.207.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.207.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.208.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.208.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.209.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.209.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.210.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.210.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.210.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.210.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.211.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.211.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.212.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.212.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.213.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.213.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.214.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.214.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.214.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.214.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.215.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.215.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.216.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.216.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.217.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.217.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.217.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.217.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.218.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.218.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.219.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.219.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.220.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.220.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.221.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.221.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.221.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.221.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.222.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.222.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.223.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.223.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.224.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.224.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.224.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.224.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.225.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.225.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.226.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.226.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.227.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.227.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.228.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.228.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.228.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.228.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.229.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.229.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.230.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.230.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.231.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.231.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.231.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.231.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.232.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.232.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.233.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.233.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.234.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.234.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.235.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.235.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.235.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.235.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.236.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.236.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.237.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.237.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.238.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.238.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.238.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.238.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.239.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.239.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.240.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.240.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.241.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.241.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.242.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.242.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.242.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.242.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.243.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.243.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.244.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.244.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.245.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.245.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.245.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.245.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.246.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.246.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.247.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.247.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.248.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.248.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.mlp.experts.249.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.249.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.249.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.249.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.250.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.250.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.251.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.251.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.252.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.up_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.10.mlp.experts.252.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.252.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.252.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.253.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.253.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.254.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.254.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.10.mlp.experts.255.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.10.mlp.experts.255.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.10.input_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.10.post_attention_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_a_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.q_a_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_a_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.q_b_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.q_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_a_proj_with_mqa.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_a_layernorm.weight": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.kv_b_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.kv_b_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.self_attn.o_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.self_attn.o_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.gate.weight": "model-00023-of-000163.safetensors", "model.layers.11.mlp.gate.e_score_correction_bias": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.shared_experts.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.shared_experts.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.11.mlp.experts.0.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.0.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.0.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.0.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.1.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.1.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.2.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.2.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.3.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.3.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.4.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.4.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.5.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.5.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.6.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.6.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.gate_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.11.mlp.experts.7.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.7.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.7.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.7.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.8.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.8.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.9.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.9.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.10.down_proj.weight": 
"model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.10.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.11.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.11.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.12.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.12.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.13.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.13.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.14.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.14.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.15.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.15.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.16.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.16.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.17.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.17.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.17.down_proj.weight": "model-00023-of-000163.safetensors", - 
"model.layers.11.mlp.experts.17.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.18.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.18.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.19.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.19.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.20.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.20.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.21.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", 
"model.layers.11.mlp.experts.21.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.21.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.21.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.up_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.22.down_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.22.down_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.23.gate_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.23.gate_proj.weight_scale_inv": "model-00023-of-000163.safetensors", "model.layers.11.mlp.experts.23.up_proj.weight": "model-00023-of-000163.safetensors", - "model.layers.11.mlp.experts.23.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.23.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.23.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.24.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.24.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.24.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.24.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.25.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.25.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.26.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.26.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.27.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.27.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.28.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.28.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.28.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.28.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.29.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.29.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.30.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.30.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.31.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.31.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.31.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.31.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.32.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.32.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.33.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.33.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.34.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.34.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.35.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.35.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.35.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.35.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.36.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.36.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.37.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.37.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.38.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.38.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.38.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.38.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.39.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.39.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.40.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.40.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.41.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.41.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.42.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.42.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.42.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.42.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.43.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.43.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.44.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.44.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.45.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.45.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.45.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.45.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.46.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.46.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.47.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.47.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.48.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.48.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.49.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.49.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.49.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.49.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.50.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.50.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.51.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.51.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.52.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.52.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.52.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.52.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.53.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.53.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.54.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.54.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.55.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.55.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.56.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.56.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.56.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.56.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.57.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.57.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.58.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.58.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.59.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.59.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.59.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.59.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.60.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.60.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.61.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.61.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.62.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.62.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.63.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.63.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.63.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.63.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.64.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.64.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.65.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.65.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.66.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.66.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.66.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.66.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.67.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.67.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.68.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.68.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.69.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.69.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.70.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.70.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.70.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.70.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.71.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.71.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.72.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.72.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.73.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.73.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.73.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.73.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.74.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.74.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.75.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.75.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.76.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.76.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.77.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.77.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.77.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.77.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.78.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.78.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.79.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.79.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.80.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.80.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.80.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.80.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.81.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.81.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.82.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.82.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.83.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.83.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.84.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.84.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.84.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.84.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.85.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.85.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.86.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.86.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.87.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.87.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.87.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.87.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.88.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.88.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.89.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.89.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.90.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.90.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.91.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.91.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.91.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.91.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.92.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.92.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.93.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.93.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.94.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.94.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.94.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.94.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.95.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.95.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.96.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.96.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.97.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.97.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.98.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.98.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.98.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.98.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.99.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.99.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.100.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.100.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.101.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.101.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.101.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.101.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.102.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.102.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.103.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.103.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.104.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.104.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.105.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.105.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.105.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.105.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.106.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.106.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.107.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.107.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.108.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.108.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.108.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.108.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.109.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.109.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.110.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.110.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.111.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.111.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.112.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.112.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.112.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.112.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.113.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.113.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.114.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.114.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.115.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.115.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.115.down_proj.weight": "model-00024-of-000163.safetensors", - 
"model.layers.11.mlp.experts.115.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.116.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.116.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.117.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.117.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.118.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.118.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.119.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", 
"model.layers.11.mlp.experts.119.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.119.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.119.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.gate_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.up_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.up_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.120.down_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.120.down_proj.weight_scale_inv": "model-00024-of-000163.safetensors", "model.layers.11.mlp.experts.121.gate_proj.weight": "model-00024-of-000163.safetensors", - "model.layers.11.mlp.experts.121.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.121.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.121.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.121.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.121.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.122.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.122.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.122.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.122.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.123.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.123.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.124.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.124.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.125.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.125.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.126.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.126.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.126.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.126.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.127.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.127.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.128.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.128.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.129.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.129.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.129.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.129.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.130.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.130.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.131.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.131.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.132.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.132.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.133.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.133.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.133.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.133.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.134.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.134.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.135.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.135.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.136.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.136.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.136.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.136.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.137.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.137.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.138.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.138.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.139.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.139.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.140.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.140.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.140.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.140.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.141.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.141.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.142.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.142.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.143.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.143.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.143.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.143.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.144.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.144.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.145.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.145.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.146.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.146.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.147.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.147.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.147.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.147.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.148.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.148.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.149.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.149.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.150.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.150.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.150.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.150.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.151.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.151.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.152.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.152.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.153.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.153.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.154.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.154.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.154.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.154.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.155.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.155.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.156.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.156.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.157.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.157.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.157.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.157.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.158.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.158.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.159.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.159.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.160.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.160.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.161.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.161.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.161.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.161.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.162.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.162.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.163.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.163.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.164.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.164.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.164.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.164.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.165.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.165.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.166.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.166.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.167.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.167.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.168.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.168.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.168.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.168.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.169.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.169.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.170.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.170.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.171.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.171.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.171.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.171.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.172.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.172.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.173.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.173.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.174.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.174.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.175.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.175.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.175.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.175.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.176.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.176.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.177.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.177.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.178.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.178.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.178.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.178.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.179.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.179.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.180.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.180.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.181.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.181.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.182.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.182.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.182.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.182.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.183.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.183.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.184.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.184.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.185.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.185.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.185.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.185.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.186.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.186.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.187.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.187.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.188.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.188.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.189.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.189.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.189.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.189.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.190.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.190.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.191.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.191.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.192.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.192.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.192.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.192.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.193.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.193.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.194.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.194.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.195.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.195.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.196.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.196.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.196.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.196.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.197.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.197.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.198.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.198.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.199.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.199.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.199.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.199.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.200.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.200.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.201.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.201.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.202.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.202.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.203.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.203.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.203.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.203.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.204.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.204.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.205.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.205.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.206.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.206.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.206.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.206.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.207.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.207.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.208.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.208.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.209.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.209.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.210.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.210.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.210.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.210.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.211.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.211.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.212.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.212.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.213.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.213.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.213.down_proj.weight": "model-00025-of-000163.safetensors", - 
"model.layers.11.mlp.experts.213.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.214.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.214.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.215.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.215.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.216.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.216.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.217.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", 
"model.layers.11.mlp.experts.217.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.217.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.217.down_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.gate_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.gate_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.up_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.up_proj.weight_scale_inv": "model-00025-of-000163.safetensors", "model.layers.11.mlp.experts.218.down_proj.weight": "model-00025-of-000163.safetensors", - "model.layers.11.mlp.experts.218.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.219.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.219.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.220.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.220.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.220.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.220.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.221.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.221.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.222.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.222.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.223.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.223.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.224.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.11.mlp.experts.224.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.224.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.224.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.225.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.225.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.226.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.226.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.227.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.227.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.227.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.227.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.228.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.228.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.229.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.229.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.230.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.230.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.231.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.11.mlp.experts.231.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.231.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.231.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.232.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.232.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.233.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.233.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.234.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.234.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.234.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.234.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.235.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.235.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.236.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.236.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.237.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.237.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.238.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.11.mlp.experts.238.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.238.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.238.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.239.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.239.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.240.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.240.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.241.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.241.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.241.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.241.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.242.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.242.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.243.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.243.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.244.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.244.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.245.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.11.mlp.experts.245.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.245.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.245.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.246.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.246.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.247.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.247.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.248.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.248.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.248.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.248.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.249.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.249.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.250.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.250.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.251.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.251.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.252.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.11.mlp.experts.252.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.252.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.252.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.253.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.253.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.254.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.254.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.255.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.11.mlp.experts.255.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.mlp.experts.255.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.11.mlp.experts.255.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.11.input_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.11.post_attention_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_a_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.q_a_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_a_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.q_b_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.q_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_a_proj_with_mqa.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_a_layernorm.weight": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.kv_b_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.kv_b_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.self_attn.o_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.self_attn.o_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.gate.weight": "model-00026-of-000163.safetensors", "model.layers.12.mlp.gate.e_score_correction_bias": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.shared_experts.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.shared_experts.down_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.shared_experts.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.0.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.0.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.1.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.1.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.2.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.2.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.up_proj.weight": 
"model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.3.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.3.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.4.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.4.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.5.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.5.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.6.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.6.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.7.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.7.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.7.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.7.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.8.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.8.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.9.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.9.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.10.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.10.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.11.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.11.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.12.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.12.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.13.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.13.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.14.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.14.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.14.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.14.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.15.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.15.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.16.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.16.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.17.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.17.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.17.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.17.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.18.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.18.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.19.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.19.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.20.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.20.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.21.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.21.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.21.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.21.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.22.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.22.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.23.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.23.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.24.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.24.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.24.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.24.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.25.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.25.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.26.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.26.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.27.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.27.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.28.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.28.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.28.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.28.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.29.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.29.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.30.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.30.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.31.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.31.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.31.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.31.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.32.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.32.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.33.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.33.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.34.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.34.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.35.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.35.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.35.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.35.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.36.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.36.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.37.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.37.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.38.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.38.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.38.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.38.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.39.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.39.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.40.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.40.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.41.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.41.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.42.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.42.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.42.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.42.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.43.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.43.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.44.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.44.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.45.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.45.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.45.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.45.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.46.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.46.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.47.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.47.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.48.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.48.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.gate_proj.weight": "model-00026-of-000163.safetensors", - 
"model.layers.12.mlp.experts.49.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.49.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.49.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.49.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.50.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.50.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.51.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.51.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.52.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.52.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", 
"model.layers.12.mlp.experts.52.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.52.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.53.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.53.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.gate_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.up_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.up_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.54.down_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.54.down_proj.weight_scale_inv": "model-00026-of-000163.safetensors", "model.layers.12.mlp.experts.55.gate_proj.weight": "model-00026-of-000163.safetensors", - "model.layers.12.mlp.experts.55.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.55.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.55.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.55.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.55.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.56.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.56.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.56.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.56.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.57.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.57.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.58.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.58.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.59.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.59.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.59.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.59.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.60.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.60.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.61.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.61.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.62.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.62.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.63.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.63.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.63.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.63.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.64.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.64.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.65.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.65.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.66.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.66.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.66.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.66.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.67.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.67.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.68.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.68.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.69.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.69.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.70.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.70.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.70.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.70.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.71.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.71.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.72.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.72.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.73.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.73.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.73.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.73.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.74.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.74.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.75.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.75.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.76.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.76.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.77.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.77.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.77.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.77.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.78.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.78.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.79.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.79.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.80.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.80.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.80.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.80.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.81.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.81.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.82.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.82.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.83.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.83.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.84.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.84.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.84.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.84.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.85.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.85.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.86.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.86.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.87.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.87.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.87.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.87.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.88.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.88.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.89.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.89.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.90.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.90.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.91.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.91.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.91.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.91.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.92.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.92.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.93.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.93.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.94.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.94.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.94.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.94.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.95.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.95.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.96.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.96.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.97.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.97.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.98.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.98.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.98.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.98.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.99.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.99.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.100.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.100.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.101.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.101.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.101.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.101.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.102.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.102.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.103.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.103.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.104.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.104.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.105.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.105.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.105.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.105.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.106.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.106.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.107.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.107.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.108.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.108.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.108.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.108.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.109.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.109.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.110.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.110.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.111.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.111.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.112.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.112.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.112.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.112.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.113.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.113.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.114.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.114.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.115.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.115.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.115.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.115.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.116.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.116.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.117.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.117.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.118.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.118.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.119.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.119.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.119.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.119.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.120.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.120.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.121.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.121.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.122.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.122.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.122.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.122.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.123.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.123.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.124.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.124.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.125.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.125.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.126.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.126.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.126.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.126.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.127.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.127.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.128.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.128.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.129.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.129.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.129.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.129.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.130.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.130.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.131.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.131.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.132.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.132.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.133.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.133.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.133.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.133.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.134.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.134.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.135.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.135.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.136.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.136.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.136.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.136.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.137.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.137.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.138.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.138.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.139.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.139.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.140.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.140.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.140.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.140.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.141.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.141.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.142.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.142.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.143.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.143.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.143.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.143.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.144.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.144.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.145.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.145.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.146.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.146.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.gate_proj.weight": "model-00027-of-000163.safetensors", - 
"model.layers.12.mlp.experts.147.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.147.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.147.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.147.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.148.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.148.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.149.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.149.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.150.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.150.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", 
"model.layers.12.mlp.experts.150.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.150.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.151.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.151.down_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.gate_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.gate_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.up_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.up_proj.weight_scale_inv": "model-00027-of-000163.safetensors", "model.layers.12.mlp.experts.152.down_proj.weight": "model-00027-of-000163.safetensors", - "model.layers.12.mlp.experts.152.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.153.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.153.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.154.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.154.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.154.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.154.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.155.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.155.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.156.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.156.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.157.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.157.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.157.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.157.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.158.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.158.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.159.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.159.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.160.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.160.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.161.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.161.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.161.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.161.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.162.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.162.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.163.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.163.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.164.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.164.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.164.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.164.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.165.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.165.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.166.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.166.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.167.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.167.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.168.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.168.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.168.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.168.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.169.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.169.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.170.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.170.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.171.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.171.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.171.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.171.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.172.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.172.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.173.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.173.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.174.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.174.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.175.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.175.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.175.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.175.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.176.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.176.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.177.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.177.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.178.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.178.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.178.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.178.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.179.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.179.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.180.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.180.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.181.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.181.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.182.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.182.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.182.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.182.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.183.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.183.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.184.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.184.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.185.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.185.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.185.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.185.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.186.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.186.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.187.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.187.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.188.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.188.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.189.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.189.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.189.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.189.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.190.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.190.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.191.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.191.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.192.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.192.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.192.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.192.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.193.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.193.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.194.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.194.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.195.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.195.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.196.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.196.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.196.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.196.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.197.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.197.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.198.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.198.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.199.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.199.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.199.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.199.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.200.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.200.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.201.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.201.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.202.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.202.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.203.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.203.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.203.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.203.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.204.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.204.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.205.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.205.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.206.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.206.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.206.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.206.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.207.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.207.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.208.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.208.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.209.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.209.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.210.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.210.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.210.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.210.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.211.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.211.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.212.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.212.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.213.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.213.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.213.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.213.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.214.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.214.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.215.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.215.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.216.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.216.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.217.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.217.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.217.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.217.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.218.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.218.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.219.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.219.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.220.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.220.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.220.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.220.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.221.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.221.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.222.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.222.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.223.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.223.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.224.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.224.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.224.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.224.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.225.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.225.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.226.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.226.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.227.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.227.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.227.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.227.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.228.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.228.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.229.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.229.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.230.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.230.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.231.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.231.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.231.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.231.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.232.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.232.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.233.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.233.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.234.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.234.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.234.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.234.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.235.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.235.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.236.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.236.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.237.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.237.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.238.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.238.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.238.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.238.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.239.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.239.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.240.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.240.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.241.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.241.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.241.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.241.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.242.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.242.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.243.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.243.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.244.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.244.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.gate_proj.weight": "model-00028-of-000163.safetensors", - 
"model.layers.12.mlp.experts.245.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.245.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.245.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.245.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.246.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.246.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.247.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.247.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.248.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.248.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", 
"model.layers.12.mlp.experts.248.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.248.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.up_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.249.down_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.249.down_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.250.gate_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.250.gate_proj.weight_scale_inv": "model-00028-of-000163.safetensors", "model.layers.12.mlp.experts.250.up_proj.weight": "model-00028-of-000163.safetensors", - "model.layers.12.mlp.experts.250.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.250.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.250.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.251.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.251.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.gate_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.12.mlp.experts.252.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.252.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.252.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.252.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.253.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.253.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.254.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.254.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.255.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.mlp.experts.255.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.12.mlp.experts.255.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.12.mlp.experts.255.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.12.input_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.12.post_attention_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_a_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.q_a_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_a_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.q_b_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.q_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_a_proj_with_mqa.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_a_layernorm.weight": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.kv_b_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.kv_b_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.self_attn.o_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.self_attn.o_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.gate.weight": "model-00029-of-000163.safetensors", "model.layers.13.mlp.gate.e_score_correction_bias": "model-00029-of-000163.safetensors", "model.layers.13.mlp.shared_experts.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.shared_experts.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.shared_experts.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.shared_experts.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.0.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.0.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.1.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.1.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.2.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.2.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.gate_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.3.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.3.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.3.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.3.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.4.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.4.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.5.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.5.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.6.down_proj.weight": 
"model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.6.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.7.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.7.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.8.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.8.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.9.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.9.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.10.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.10.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.10.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.10.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.11.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.11.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.12.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.12.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.13.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.13.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.13.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.13.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.14.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.14.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.15.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.15.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.16.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.16.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.17.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.17.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.17.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.17.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.18.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.18.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.19.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.19.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.20.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.20.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.20.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.20.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.21.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.21.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.22.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.22.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.23.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.23.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.24.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.24.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.24.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.24.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.25.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.25.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.26.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.26.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.27.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.27.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.27.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.27.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.28.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.28.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.29.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.29.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.30.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.30.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.31.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.31.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.31.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.31.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.32.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.32.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.33.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.33.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.34.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.34.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.34.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.34.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.35.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.35.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.36.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.36.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.37.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.37.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.38.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.38.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.38.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.38.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.39.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.39.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.40.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.40.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.41.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.41.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.41.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.41.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.42.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.42.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.43.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.43.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.44.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.44.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.45.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.45.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.45.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.45.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.46.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.46.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.47.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.47.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.48.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.48.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.48.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.48.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.49.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.49.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.50.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.50.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.51.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.51.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.52.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.52.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.52.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.52.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.53.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.53.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.54.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.54.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.55.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.55.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.55.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.55.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.56.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.56.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.57.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.57.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.58.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.58.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.59.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.59.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.59.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.59.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.60.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.60.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.61.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.61.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.62.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.62.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.62.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.62.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.63.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.63.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.64.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.64.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.65.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.65.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.66.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.66.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.66.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.66.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.67.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.67.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.68.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.68.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.69.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.69.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.69.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.69.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.70.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.70.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.71.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.71.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.72.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.72.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.73.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.73.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.73.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.73.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.74.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.74.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.75.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.75.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.76.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.76.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.76.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.76.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.77.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.77.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.78.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.78.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.79.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.79.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.80.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", 
"model.layers.13.mlp.experts.80.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.80.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.80.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.81.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.81.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.82.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.82.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.83.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.83.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.83.down_proj.weight": "model-00029-of-000163.safetensors", - 
"model.layers.13.mlp.experts.83.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.84.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.84.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.85.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.85.down_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.gate_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.gate_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.up_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.up_proj.weight_scale_inv": "model-00029-of-000163.safetensors", "model.layers.13.mlp.experts.86.down_proj.weight": "model-00029-of-000163.safetensors", - "model.layers.13.mlp.experts.86.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.87.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.87.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.87.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.87.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.88.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.88.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.89.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.89.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.90.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.90.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.90.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.90.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.91.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.91.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.92.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.92.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.93.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.93.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.94.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.94.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.94.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.94.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.95.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.95.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.96.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.96.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.97.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.97.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.97.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.97.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.98.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.98.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.99.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.99.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.100.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.100.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.101.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.101.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.101.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.101.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.102.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.102.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.103.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.103.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.104.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.104.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.104.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.104.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.105.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.105.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.106.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.106.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.107.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.107.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.108.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.108.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.108.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.108.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.109.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.109.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.110.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.110.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.111.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.111.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.111.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.111.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.112.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.112.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.113.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.113.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.114.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.114.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.115.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.115.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.115.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.115.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.116.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.116.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.117.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.117.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.118.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.118.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.118.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.118.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.119.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.119.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.120.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.120.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.121.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.121.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.122.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.122.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.122.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.122.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.123.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.123.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.124.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.124.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.125.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.125.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.125.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.125.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.126.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.126.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.127.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.127.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.128.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.128.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.129.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.129.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.129.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.129.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.130.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.130.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.131.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.131.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.132.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.132.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.132.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.132.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.133.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.133.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.134.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.134.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.135.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.135.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.136.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.136.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.136.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.136.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.137.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.137.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.138.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.138.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.139.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.139.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.139.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.139.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.140.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.140.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.141.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.141.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.142.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.142.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.143.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.143.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.143.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.143.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.144.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.144.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.145.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.145.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.146.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.146.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.146.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.146.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.147.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.147.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.148.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.148.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.149.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.149.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.150.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.150.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.150.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.150.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.151.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.151.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.152.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.152.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.153.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.153.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.153.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.153.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.154.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.154.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.155.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.155.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.156.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.156.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.157.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.157.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.157.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.157.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.158.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.158.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.159.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.159.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.160.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.160.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.160.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.160.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.161.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.161.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.162.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.162.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.163.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.163.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.164.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.164.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.164.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.164.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.165.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.165.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.166.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.166.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.167.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.167.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.167.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.167.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.168.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.168.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.169.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.169.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.170.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.170.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.171.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.171.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.171.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.171.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.172.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.172.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.173.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.173.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.174.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.174.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.174.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.174.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.175.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.175.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.176.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.176.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.177.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.177.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.178.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", 
"model.layers.13.mlp.experts.178.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.178.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.178.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.179.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.179.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.180.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.180.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.181.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.181.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.181.down_proj.weight": "model-00030-of-000163.safetensors", - 
"model.layers.13.mlp.experts.181.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.182.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.182.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.up_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.183.down_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.183.down_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.184.gate_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.184.gate_proj.weight_scale_inv": "model-00030-of-000163.safetensors", "model.layers.13.mlp.experts.184.up_proj.weight": "model-00030-of-000163.safetensors", - "model.layers.13.mlp.experts.184.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.184.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.184.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.185.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.185.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.185.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.185.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.186.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.186.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.187.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.187.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.188.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.188.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.188.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.188.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.189.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.189.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.190.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.190.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.191.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.191.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.192.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.192.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.192.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.192.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.193.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.193.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.194.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.194.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.195.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.195.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.195.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.195.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.196.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.196.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.197.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.197.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.198.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.198.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.199.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.199.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.199.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.199.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.200.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.200.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.201.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.201.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.202.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.202.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.202.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.202.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.203.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.203.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.204.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.204.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.205.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.205.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.206.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.206.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.206.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.206.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.207.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.207.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.208.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.208.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.209.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.209.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.209.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.209.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.210.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.210.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.211.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.211.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.212.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.212.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.213.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.213.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.213.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.213.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.214.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.214.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.215.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.215.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.216.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.216.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.216.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.216.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.217.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.217.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.218.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.218.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.219.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.219.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.220.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.220.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.220.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.220.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.221.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.221.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.222.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.222.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.223.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.223.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.223.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.223.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.224.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.224.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.225.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.225.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.226.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.226.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.227.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.227.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.227.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.227.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.228.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.228.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.229.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.229.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.230.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.230.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.230.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.230.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.231.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.231.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.232.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.232.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.233.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.233.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.234.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.234.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.234.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.234.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.235.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.235.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.236.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.236.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.237.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.237.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.237.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.237.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.238.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.238.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.239.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.239.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.240.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.240.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.241.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.241.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.241.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.241.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.242.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.242.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.243.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.243.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.244.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.244.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.244.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.244.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.245.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.245.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.246.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.246.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.247.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.247.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.248.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.248.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.248.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.248.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.249.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.249.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.250.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.250.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.251.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.251.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.251.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.13.mlp.experts.251.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.252.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.252.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.253.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.253.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.254.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.254.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.255.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.13.mlp.experts.255.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.mlp.experts.255.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.13.mlp.experts.255.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.13.input_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.13.post_attention_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_a_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.q_a_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_a_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.q_b_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.q_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_a_proj_with_mqa.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_a_layernorm.weight": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.kv_b_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.kv_b_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.self_attn.o_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.self_attn.o_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.gate.weight": "model-00031-of-000163.safetensors", "model.layers.14.mlp.gate.e_score_correction_bias": "model-00031-of-000163.safetensors", "model.layers.14.mlp.shared_experts.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.14.mlp.shared_experts.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.shared_experts.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.shared_experts.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.0.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.0.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.1.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.1.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.2.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.2.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.2.down_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.14.mlp.experts.2.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.3.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.3.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.4.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.4.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.5.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.5.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.up_proj.weight": 
"model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.6.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.6.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.7.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.7.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.8.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.8.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.9.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.9.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.14.mlp.experts.10.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.10.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.10.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.10.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.11.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.11.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.12.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.12.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.13.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.up_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.14.mlp.experts.13.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.13.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.13.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.14.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.14.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.15.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.15.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.16.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.16.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", 
"model.layers.14.mlp.experts.17.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.17.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.17.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.17.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.18.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.18.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.up_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.19.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.19.down_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.gate_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.20.gate_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.up_proj.weight": "model-00031-of-000163.safetensors", - 
"model.layers.14.mlp.experts.20.up_proj.weight_scale_inv": "model-00031-of-000163.safetensors", "model.layers.14.mlp.experts.20.down_proj.weight": "model-00031-of-000163.safetensors", - "model.layers.14.mlp.experts.20.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.21.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.21.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.22.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.22.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.23.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.23.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.24.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.24.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.24.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.24.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.25.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.25.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.26.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.26.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.27.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.27.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.27.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.27.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.28.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.28.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.29.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.29.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.30.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.30.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.31.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.31.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.31.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.31.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.32.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.32.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.33.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.33.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.34.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.34.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.34.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.34.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.35.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.35.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.36.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.36.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.37.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.37.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.38.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.38.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.38.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.38.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.39.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.39.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.40.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.40.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.41.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.41.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.41.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.41.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.42.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.42.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.43.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.43.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.44.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.44.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.45.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.45.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.45.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.45.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.46.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.46.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.47.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.47.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.48.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.48.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.48.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.48.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.49.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.49.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.50.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.50.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.51.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.51.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.52.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.52.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.52.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.52.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.53.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.53.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.54.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.54.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.55.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.55.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.55.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.55.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.56.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.56.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.57.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.57.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.58.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.58.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.59.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.59.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.59.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.59.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.60.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.60.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.61.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.61.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.62.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.62.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.62.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.62.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.63.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.63.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.64.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.64.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.65.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.65.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.66.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.66.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.66.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.66.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.67.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.67.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.68.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.68.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.69.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.69.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.69.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.69.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.70.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.70.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.71.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.71.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.72.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.72.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.73.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.73.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.73.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.73.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.74.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.74.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.75.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.75.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.76.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.76.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.76.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.76.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.77.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.77.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.78.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.78.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.79.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.79.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.80.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.80.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.80.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.80.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.81.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.81.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.82.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.82.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.83.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.83.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.83.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.83.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.84.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.84.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.85.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.85.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.86.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.86.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.87.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.87.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.87.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.87.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.88.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.88.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.89.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.89.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.90.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.90.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.90.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.90.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.91.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.91.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.92.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.92.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.93.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.93.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.94.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.94.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.94.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.94.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.95.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.95.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.96.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.96.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.97.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.97.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.97.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.97.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.98.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.98.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.99.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.99.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.100.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.100.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.101.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.101.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.101.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.101.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.102.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.102.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.103.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.103.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.104.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.104.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.104.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.104.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.105.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.105.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.106.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.106.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.107.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.107.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.108.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.108.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.108.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.108.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.109.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.109.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.110.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.110.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.111.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.111.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.111.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.111.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.112.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.112.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.113.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.113.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.114.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.114.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", 
"model.layers.14.mlp.experts.115.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.115.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.115.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.115.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.116.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.116.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.up_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.up_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.117.down_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.117.down_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.118.gate_proj.weight": "model-00032-of-000163.safetensors", - "model.layers.14.mlp.experts.118.gate_proj.weight_scale_inv": "model-00032-of-000163.safetensors", "model.layers.14.mlp.experts.118.up_proj.weight": "model-00032-of-000163.safetensors", - 
"model.layers.14.mlp.experts.118.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.118.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.118.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.119.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.119.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.120.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.120.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.121.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.121.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.122.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.122.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.122.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.122.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.123.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.123.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.124.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.124.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.125.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.125.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.125.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.125.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.126.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.126.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.127.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.127.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.128.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.128.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.129.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.129.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.129.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.129.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.130.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.130.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.131.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.131.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.132.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.132.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.132.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.132.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.133.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.133.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.134.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.134.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.135.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.135.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.136.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.136.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.136.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.136.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.137.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.137.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.138.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.138.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.139.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.139.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.139.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.139.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.140.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.140.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.141.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.141.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.142.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.142.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.143.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.143.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.143.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.143.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.144.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.144.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.145.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.145.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.146.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.146.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.146.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.146.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.147.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.147.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.148.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.148.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.149.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.149.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.150.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.150.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.150.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.150.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.151.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.151.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.152.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.152.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.153.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.153.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.153.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.153.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.154.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.154.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.155.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.155.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.156.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.156.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.157.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.157.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.157.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.157.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.158.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.158.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.159.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.159.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.160.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.160.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.160.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.160.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.161.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.161.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.162.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.162.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.163.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.163.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.164.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.164.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.164.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.164.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.165.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.165.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.166.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.166.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.167.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.167.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.167.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.167.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.168.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.168.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.169.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.169.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.170.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.170.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.171.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.171.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.171.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.171.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.172.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.172.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.173.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.173.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.174.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.174.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.174.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.174.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.175.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.175.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.176.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.176.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.177.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.177.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.178.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.178.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.178.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.178.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.179.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.179.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.180.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.180.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.181.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.181.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.181.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.181.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.182.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.182.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.183.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.183.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.184.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.184.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.185.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.185.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.185.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.185.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.186.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.186.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.187.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.187.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.188.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.188.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.188.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.188.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.189.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.189.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.190.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.190.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.191.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.191.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.192.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.192.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.192.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.192.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.193.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.193.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.194.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.194.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.195.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.195.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.195.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.195.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.196.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.196.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.197.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.197.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.198.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.198.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.199.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.199.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.199.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.199.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.200.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.200.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.201.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.201.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.202.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.202.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.202.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.202.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.203.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.203.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.204.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.204.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.205.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.205.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.206.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.206.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.206.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.206.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.207.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.207.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.208.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.208.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.209.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.up_proj.weight": "model-00033-of-000163.safetensors", - 
"model.layers.14.mlp.experts.209.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.209.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.209.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.210.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.210.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.211.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.211.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.212.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.212.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", 
"model.layers.14.mlp.experts.213.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.213.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.213.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.213.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.214.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.214.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.gate_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.up_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.up_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.215.down_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.215.down_proj.weight_scale_inv": "model-00033-of-000163.safetensors", "model.layers.14.mlp.experts.216.gate_proj.weight": "model-00033-of-000163.safetensors", - "model.layers.14.mlp.experts.216.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.216.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.216.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.216.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.216.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.217.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.217.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.218.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.218.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.219.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.219.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.220.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.220.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.220.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.220.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.221.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.221.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.222.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.222.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.223.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.223.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.223.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.223.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.224.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.224.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.225.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.225.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.226.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.226.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.227.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.227.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.227.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.227.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.228.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.228.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.229.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.229.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.230.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.230.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.230.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.230.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.231.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.231.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.232.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.232.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.233.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.233.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.234.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.234.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.234.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.234.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.235.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.235.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.236.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.236.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.237.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.237.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.237.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.237.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.238.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.238.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.239.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.239.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.240.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.240.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.241.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.241.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.241.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.241.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.242.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.242.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.243.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.243.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.244.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.244.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.244.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.244.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.245.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.245.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.246.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.246.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.247.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.247.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.248.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.248.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.248.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.248.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.249.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.249.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.250.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.250.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.251.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.up_proj.weight": "model-00034-of-000163.safetensors", - 
"model.layers.14.mlp.experts.251.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.251.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.251.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.252.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.252.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.253.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.253.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.254.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.254.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", 
"model.layers.14.mlp.experts.255.gate_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.gate_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.255.up_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.up_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.mlp.experts.255.down_proj.weight": "model-00034-of-000163.safetensors", - "model.layers.14.mlp.experts.255.down_proj.weight_scale_inv": "model-00034-of-000163.safetensors", "model.layers.14.input_layernorm.weight": "model-00034-of-000163.safetensors", "model.layers.14.post_attention_layernorm.weight": "model-00034-of-000163.safetensors", "model.layers.15.self_attn.q_a_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.q_a_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.q_a_layernorm.weight": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.q_b_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.q_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_a_proj_with_mqa.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_a_layernorm.weight": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.kv_b_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.kv_b_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.self_attn.o_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.self_attn.o_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.gate.weight": "model-00035-of-000163.safetensors", "model.layers.15.mlp.gate.e_score_correction_bias": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.shared_experts.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.shared_experts.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.shared_experts.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.shared_experts.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.0.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.0.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.1.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.1.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.2.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.up_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.2.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.2.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.2.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.3.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.3.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.4.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.4.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.5.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.5.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.gate_proj.weight": 
"model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.6.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.6.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.7.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.7.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.8.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.8.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.9.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.9.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.9.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.9.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.10.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.10.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.11.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.11.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.12.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.12.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.13.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.13.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.13.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.13.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.14.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.14.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.15.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.15.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.16.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.16.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.16.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.16.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.17.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.17.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.18.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.18.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.19.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.19.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.20.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.20.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.20.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.20.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.21.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.21.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.22.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.22.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.23.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.23.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.23.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.23.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.24.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.24.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.25.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.25.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.26.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.26.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.27.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.27.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.27.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.27.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.28.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.28.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.29.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.29.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.30.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.30.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.30.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.30.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.31.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.31.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.32.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.32.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.33.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.33.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.34.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.34.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.34.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.34.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.35.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.35.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.36.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.36.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.37.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.37.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.37.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.37.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.38.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.38.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.39.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.39.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.40.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.40.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.41.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.41.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.41.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.41.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.42.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.42.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.43.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.43.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.44.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.44.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.44.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.44.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.45.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.45.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.46.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.46.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.47.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.47.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.48.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.48.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.48.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.48.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.49.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.49.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.50.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.50.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.51.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.51.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.51.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.51.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.52.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.52.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.53.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.53.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.54.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.54.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.55.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.55.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.55.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.55.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.56.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.56.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.57.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.57.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.58.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.58.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.58.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.58.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.59.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.59.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.60.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.60.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.61.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.61.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.62.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.62.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.62.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.62.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.63.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.63.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.64.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.64.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.65.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.65.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.65.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.65.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.66.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.66.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.67.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.67.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.68.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.68.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.69.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.69.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.69.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.69.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.70.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.70.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.71.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.71.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.72.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.72.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.72.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.72.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.73.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.73.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.74.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.74.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.75.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.75.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.76.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.76.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.76.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.76.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.77.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.77.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.78.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.78.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.79.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.79.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.79.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.79.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.80.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.80.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.81.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.81.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.82.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.82.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.83.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.83.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.83.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.83.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.84.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.84.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.85.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.85.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.86.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.86.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", 
"model.layers.15.mlp.experts.86.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.86.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.87.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.87.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.88.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.88.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.89.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.89.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.gate_proj.weight": "model-00035-of-000163.safetensors", - 
"model.layers.15.mlp.experts.90.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.90.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.90.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.90.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.gate_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.up_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.up_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.91.down_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.91.down_proj.weight_scale_inv": "model-00035-of-000163.safetensors", "model.layers.15.mlp.experts.92.gate_proj.weight": "model-00035-of-000163.safetensors", - "model.layers.15.mlp.experts.92.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.92.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.92.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.92.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.92.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.93.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.93.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.93.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.93.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.94.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.94.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.95.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.95.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.96.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.96.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.97.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.97.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.97.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.97.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.98.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.98.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.99.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.99.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.100.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.100.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.100.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.100.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.101.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.101.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.102.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.102.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.103.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.103.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.104.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.104.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.104.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.104.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.105.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.105.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.106.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.106.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.107.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.107.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.107.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.107.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.108.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.108.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.109.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.109.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.110.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.110.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.111.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.111.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.111.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.111.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.112.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.112.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.113.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.113.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.114.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.114.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.114.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.114.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.115.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.115.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.116.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.116.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.117.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.117.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.118.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.118.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.118.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.118.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.119.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.119.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.120.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.120.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.121.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.121.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.121.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.121.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.122.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.122.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.123.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.123.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.124.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.124.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.125.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.125.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.125.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.125.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.126.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.126.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.127.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.127.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.128.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.128.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.128.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.128.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.129.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.129.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.130.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.130.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.131.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.131.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.132.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.132.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.132.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.132.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.133.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.133.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.134.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.134.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.135.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.135.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.135.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.135.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.136.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.136.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.137.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.137.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.138.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.138.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.139.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.139.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.139.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.139.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.140.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.140.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.141.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.141.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.142.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.142.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.142.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.142.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.143.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.143.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.144.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.144.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.145.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.145.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.146.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.146.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.146.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.146.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.147.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.147.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.148.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.148.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.149.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.149.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.149.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.149.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.150.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.150.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.151.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.151.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.152.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.152.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.153.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.153.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.153.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.153.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.154.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.154.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.155.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.155.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.156.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.156.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.156.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.156.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.157.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.157.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.158.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.158.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.159.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.159.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.160.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.160.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.160.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.160.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.161.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.161.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.162.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.162.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.163.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.163.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.163.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.163.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.164.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.164.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.165.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.165.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.166.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.166.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.167.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.167.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.167.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.167.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.168.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.168.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.169.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.169.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.170.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.170.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.170.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.170.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.171.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.171.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.172.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.172.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.173.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.173.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.174.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.174.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.174.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.174.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.175.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.175.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.176.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.176.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.177.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.177.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.177.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.177.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.178.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.178.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.179.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.179.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.180.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.180.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.181.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.181.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.181.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.181.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.182.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.182.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.183.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.183.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.184.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.184.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", 
"model.layers.15.mlp.experts.184.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.184.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.185.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.185.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.186.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.186.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.187.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.187.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.gate_proj.weight": "model-00036-of-000163.safetensors", - 
"model.layers.15.mlp.experts.188.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.188.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.188.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.188.down_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.gate_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.gate_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.up_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.up_proj.weight_scale_inv": "model-00036-of-000163.safetensors", "model.layers.15.mlp.experts.189.down_proj.weight": "model-00036-of-000163.safetensors", - "model.layers.15.mlp.experts.189.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.190.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.190.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.191.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.191.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.191.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.191.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.192.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.192.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.193.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.193.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.194.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.194.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.195.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.195.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.195.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.195.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.196.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.196.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.197.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.197.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.198.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.198.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.198.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.198.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.199.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.199.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.200.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.200.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.201.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.201.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.202.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.202.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.202.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.202.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.203.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.203.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.204.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.204.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.205.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.205.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.205.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.205.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.206.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.206.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.207.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.207.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.208.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.208.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.209.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.209.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.209.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.209.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.210.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.210.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.211.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.211.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.212.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.212.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.212.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.212.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.213.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.213.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.214.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.214.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.215.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.215.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.216.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.216.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.216.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.216.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.217.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.217.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.218.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.218.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.219.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.219.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.219.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.219.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.220.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.220.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.221.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.221.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.222.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.222.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.223.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.223.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.223.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.223.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.224.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.224.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.225.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.225.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.226.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.226.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.226.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.226.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.227.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.227.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.228.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.228.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.229.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.229.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.230.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.230.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.230.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.230.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.231.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.231.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.232.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.232.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.233.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.233.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.233.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.233.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.234.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.234.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.235.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.235.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.236.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.236.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.237.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.237.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.237.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.237.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.238.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.238.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.239.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.239.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.240.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.240.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.240.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.240.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.241.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.241.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.242.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.242.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.243.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.243.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.244.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.244.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.244.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.244.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.245.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.245.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.246.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.246.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.247.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.247.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.247.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.247.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.248.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.248.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.249.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.249.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.250.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.250.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.15.mlp.experts.251.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.251.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.251.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.251.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.252.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.252.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.253.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.253.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.254.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.254.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.15.mlp.experts.254.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.254.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.mlp.experts.255.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.15.mlp.experts.255.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.15.input_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.15.post_attention_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_a_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.q_a_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_a_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.q_b_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.q_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_a_proj_with_mqa.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_a_layernorm.weight": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.kv_b_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.kv_b_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.self_attn.o_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.self_attn.o_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.16.mlp.gate.weight": "model-00037-of-000163.safetensors", "model.layers.16.mlp.gate.e_score_correction_bias": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.shared_experts.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.shared_experts.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.0.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.0.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.1.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.1.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.gate_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.16.mlp.experts.2.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.2.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.2.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.2.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.3.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.3.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.4.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.4.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.5.down_proj.weight": 
"model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.5.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.6.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.6.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.7.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.7.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.8.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.8.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.9.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.16.mlp.experts.9.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.9.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.9.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.10.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.10.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.11.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.11.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.12.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.12.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.12.down_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.16.mlp.experts.12.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.13.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.13.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.14.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.14.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.15.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.15.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.16.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.16.mlp.experts.16.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.16.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.16.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.17.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.17.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.18.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.18.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.19.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.19.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.19.down_proj.weight": "model-00037-of-000163.safetensors", - 
"model.layers.16.mlp.experts.19.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.20.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.20.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.21.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.21.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.22.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.22.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.23.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", 
"model.layers.16.mlp.experts.23.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.23.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.23.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.24.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.24.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.gate_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.up_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.up_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.25.down_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.25.down_proj.weight_scale_inv": "model-00037-of-000163.safetensors", "model.layers.16.mlp.experts.26.gate_proj.weight": "model-00037-of-000163.safetensors", - "model.layers.16.mlp.experts.26.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.26.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.26.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.26.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.26.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.27.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.27.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.28.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.28.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.29.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.29.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.30.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.30.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.30.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.30.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.31.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.31.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.32.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.32.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.33.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.33.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.33.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.33.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.34.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.34.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.35.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.35.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.36.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.36.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.37.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.37.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.37.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.37.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.38.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.38.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.39.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.39.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.40.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.40.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.40.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.40.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.41.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.41.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.42.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.42.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.43.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.43.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.44.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.44.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.44.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.44.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.45.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.45.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.46.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.46.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.47.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.47.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.47.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.47.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.48.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.48.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.49.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.49.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.50.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.50.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.51.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.51.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.51.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.51.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.52.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.52.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.53.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.53.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.54.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.54.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.54.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.54.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.55.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.55.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.56.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.56.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.57.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.57.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.58.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.58.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.58.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.58.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.59.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.59.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.60.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.60.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.61.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.61.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.61.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.61.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.62.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.62.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.63.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.63.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.64.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.64.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.65.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.65.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.65.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.65.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.66.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.66.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.67.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.67.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.68.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.68.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.68.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.68.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.69.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.69.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.70.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.70.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.71.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.71.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.72.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.72.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.72.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.72.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.73.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.73.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.74.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.74.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.75.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.75.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.75.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.75.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.76.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.76.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.77.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.77.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.78.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.78.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.79.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.79.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.79.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.79.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.80.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.80.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.81.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.81.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.82.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.82.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.82.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.82.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.83.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.83.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.84.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.84.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.85.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.85.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.86.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.86.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.86.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.86.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.87.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.87.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.88.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.88.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.89.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.89.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.89.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.89.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.90.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.90.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.91.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.91.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.92.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.92.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.93.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.93.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.93.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.93.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.94.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.94.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.95.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.95.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.96.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.96.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.96.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.96.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.97.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.97.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.98.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.98.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.99.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.99.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.100.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.100.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.100.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.100.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.101.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.101.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.102.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.102.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.103.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.103.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.103.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.103.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.104.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.104.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.105.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.105.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.106.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.106.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.107.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.107.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.107.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.107.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.108.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.108.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.109.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.109.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.110.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.110.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.110.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.110.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.111.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.111.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.112.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.112.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.113.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.113.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.114.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.114.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.114.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.114.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.115.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.115.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.116.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.116.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.117.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.117.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.117.down_proj.weight": "model-00038-of-000163.safetensors", - 
"model.layers.16.mlp.experts.117.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.118.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.118.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.119.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.119.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.120.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.120.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.121.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", 
"model.layers.16.mlp.experts.121.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.121.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.121.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.122.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.122.down_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.gate_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.gate_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.up_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.up_proj.weight_scale_inv": "model-00038-of-000163.safetensors", "model.layers.16.mlp.experts.123.down_proj.weight": "model-00038-of-000163.safetensors", - "model.layers.16.mlp.experts.123.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.124.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.124.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.124.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.124.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.125.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.125.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.126.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.126.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.127.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.127.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.128.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.128.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.128.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.128.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.129.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.129.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.130.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.130.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.131.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.131.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.131.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.131.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.132.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.132.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.133.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.133.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.134.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.134.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.135.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.135.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.135.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.135.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.136.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.136.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.137.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.137.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.138.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.138.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.138.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.138.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.139.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.139.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.140.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.140.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.141.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.141.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.142.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.142.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.142.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.142.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.143.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.143.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.144.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.144.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.145.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.145.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.145.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.145.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.146.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.146.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.147.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.147.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.148.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.148.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.149.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.149.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.149.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.149.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.150.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.150.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.151.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.151.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.152.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.152.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.152.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.152.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.153.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.153.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.154.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.154.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.155.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.155.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.156.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.156.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.156.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.156.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.157.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.157.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.158.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.158.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.159.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.159.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.159.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.159.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.160.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.160.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.161.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.161.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.162.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.162.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.163.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.163.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.163.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.163.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.164.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.164.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.165.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.165.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.166.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.166.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.166.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.166.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.167.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.167.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.168.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.168.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.169.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.169.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.170.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.170.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.170.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.170.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.171.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.171.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.172.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.172.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.173.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.173.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.173.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.173.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.174.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.174.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.175.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.175.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.176.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.176.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.177.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.177.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.177.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.177.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.178.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.178.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.179.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.179.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.180.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.180.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.180.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.180.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.181.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.181.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.182.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.182.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.183.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.183.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.184.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.184.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.184.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.184.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.185.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.185.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.186.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.186.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.187.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.187.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.187.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.187.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.188.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.188.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.189.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.189.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.190.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.190.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.191.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.191.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.191.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.191.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.192.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.192.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.193.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.193.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.194.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.194.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.194.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.194.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.195.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.195.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.196.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.196.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.197.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.197.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.198.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.198.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.198.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.198.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.199.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.199.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.200.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.200.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.201.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.201.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.201.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.201.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.202.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.202.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.203.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.203.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.204.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.204.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.205.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.205.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.205.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.205.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.206.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.206.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.207.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.207.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.208.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.208.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.208.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.208.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.209.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.209.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.210.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.210.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.211.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.211.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.212.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.212.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.212.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.212.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.213.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.213.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.214.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.214.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.215.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.215.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.215.down_proj.weight": "model-00039-of-000163.safetensors", - 
"model.layers.16.mlp.experts.215.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.216.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.216.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.217.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.217.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.218.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.218.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.219.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", 
"model.layers.16.mlp.experts.219.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.219.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.219.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.up_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.220.down_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.220.down_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.221.gate_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.221.gate_proj.weight_scale_inv": "model-00039-of-000163.safetensors", "model.layers.16.mlp.experts.221.up_proj.weight": "model-00039-of-000163.safetensors", - "model.layers.16.mlp.experts.221.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.221.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.221.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.222.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.222.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.222.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.16.mlp.experts.222.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.223.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.223.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.224.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.224.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.225.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.225.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.226.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.16.mlp.experts.226.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.226.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.226.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.227.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.227.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.228.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.228.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.229.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.229.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.229.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.16.mlp.experts.229.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.230.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.230.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.231.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.231.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.232.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.232.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.233.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.16.mlp.experts.233.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.233.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.233.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.234.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.234.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.235.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.235.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.236.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.236.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.236.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.16.mlp.experts.236.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.237.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.237.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.238.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.238.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.239.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.239.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.240.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.16.mlp.experts.240.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.240.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.240.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.241.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.241.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.242.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.242.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.243.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.243.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.243.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.16.mlp.experts.243.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.244.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.244.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.245.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.245.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.246.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.246.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.247.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.16.mlp.experts.247.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.247.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.247.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.248.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.248.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.249.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.249.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.250.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.250.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.250.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.16.mlp.experts.250.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.251.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.251.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.252.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.252.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.253.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.253.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.254.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.16.mlp.experts.254.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.254.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.254.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.mlp.experts.255.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.16.mlp.experts.255.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.16.input_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.16.post_attention_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_a_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.q_a_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_a_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.q_b_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.q_b_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_a_proj_with_mqa.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_a_layernorm.weight": "model-00040-of-000163.safetensors", "model.layers.17.self_attn.kv_b_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.kv_b_proj.weight_scale_inv": 
"model-00040-of-000163.safetensors", "model.layers.17.self_attn.o_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.self_attn.o_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.gate.weight": "model-00040-of-000163.safetensors", "model.layers.17.mlp.gate.e_score_correction_bias": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.shared_experts.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.shared_experts.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.0.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.0.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.1.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.1.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.1.down_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.1.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.2.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.2.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.3.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.3.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.4.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.4.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.up_proj.weight": 
"model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.5.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.5.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.6.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.6.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.7.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.7.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.8.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.8.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.9.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.9.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.9.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.9.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.10.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.10.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.11.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.11.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.12.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.12.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.12.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.12.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.13.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.13.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.14.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.14.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.15.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.15.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.16.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.16.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.16.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.16.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.17.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.17.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.18.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.18.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.19.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.19.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.19.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.19.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.20.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.20.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.21.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.21.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.22.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.22.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.23.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.23.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.23.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.23.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.24.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.24.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.25.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.25.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.26.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.26.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.26.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.26.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.27.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.27.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.28.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.28.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.29.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.29.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.30.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.30.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.30.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.30.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.31.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.31.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.32.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.32.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.33.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.33.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.33.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.33.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.34.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.34.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.35.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.35.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.36.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.36.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.37.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.37.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.37.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.37.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.38.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.38.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.39.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.39.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.40.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.40.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.40.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.40.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.41.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.41.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.42.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.42.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.43.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.43.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.44.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.44.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.44.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.44.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.45.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.45.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.46.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.46.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.47.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.47.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.47.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.47.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.48.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.48.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.49.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.49.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.50.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.50.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", 
"model.layers.17.mlp.experts.51.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.51.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.51.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.51.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.52.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.52.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.53.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.53.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.54.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.up_proj.weight": "model-00040-of-000163.safetensors", - 
"model.layers.17.mlp.experts.54.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.54.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.54.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.55.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.55.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.56.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.56.down_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.gate_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.gate_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.up_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.up_proj.weight_scale_inv": "model-00040-of-000163.safetensors", "model.layers.17.mlp.experts.57.down_proj.weight": "model-00040-of-000163.safetensors", - "model.layers.17.mlp.experts.57.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.58.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.58.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.58.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.58.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.59.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.59.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.60.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.60.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.61.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.61.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.61.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.61.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.62.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.62.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.63.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.63.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.64.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.64.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.65.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.65.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.65.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.65.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.66.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.66.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.67.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.67.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.68.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.68.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.68.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.68.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.69.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.69.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.70.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.70.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.71.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.71.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.72.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.72.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.72.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.72.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.73.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.73.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.74.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.74.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.75.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.75.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.75.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.75.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.76.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.76.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.77.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.77.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.78.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.78.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.79.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.79.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.79.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.79.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.80.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.80.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.81.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.81.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.82.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.82.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.82.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.82.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.83.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.83.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.84.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.84.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.85.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.85.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.86.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.86.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.86.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.86.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.87.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.87.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.88.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.88.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.89.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.89.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.89.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.89.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.90.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.90.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.91.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.91.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.92.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.92.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.93.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.93.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.93.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.93.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.94.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.94.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.95.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.95.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.96.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.96.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.96.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.96.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.97.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.97.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.98.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.98.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.99.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.99.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.100.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.100.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.100.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.100.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.101.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.101.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.102.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.102.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.103.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.103.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.103.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.103.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.104.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.104.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.105.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.105.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.106.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.106.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.107.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.107.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.107.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.107.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.108.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.108.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.109.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.109.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.110.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.110.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.110.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.110.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.111.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.111.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.112.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.112.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.113.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.113.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.114.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.114.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.114.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.114.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.115.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.115.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.116.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.116.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.117.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.117.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.117.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.117.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.118.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.118.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.119.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.119.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.120.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.120.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.121.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.121.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.121.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.121.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.122.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.122.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.123.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.123.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.124.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.124.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.124.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.124.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.125.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.125.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.126.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.126.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.127.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.127.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.128.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.128.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.128.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.128.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.129.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.129.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.130.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.130.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.131.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.131.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.131.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.131.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.132.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.132.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.133.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.133.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.134.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.134.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.135.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.135.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.135.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.135.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.136.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.136.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.137.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.137.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.138.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.138.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.138.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.138.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.139.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.139.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.140.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.140.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.141.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.141.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.142.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.142.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.142.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.142.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.143.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.143.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.144.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.144.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.145.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.145.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.145.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.145.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.146.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.146.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.147.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.147.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.148.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.148.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", 
"model.layers.17.mlp.experts.149.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.149.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.149.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.149.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.150.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.150.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.151.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.151.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.152.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.up_proj.weight": "model-00041-of-000163.safetensors", - 
"model.layers.17.mlp.experts.152.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.152.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.152.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.153.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.153.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.up_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.154.down_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.154.down_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.155.gate_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.155.gate_proj.weight_scale_inv": "model-00041-of-000163.safetensors", "model.layers.17.mlp.experts.155.up_proj.weight": "model-00041-of-000163.safetensors", - "model.layers.17.mlp.experts.155.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.155.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.155.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.156.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.156.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.156.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.156.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.157.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.157.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.158.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.158.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.159.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.159.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.159.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.159.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.160.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.160.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.161.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.161.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.162.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.162.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.163.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.163.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.163.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.163.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.164.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.164.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.165.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.165.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.166.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.166.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.166.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.166.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.167.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.167.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.168.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.168.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.169.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.169.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.170.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.170.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.170.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.170.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.171.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.171.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.172.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.172.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.173.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.173.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.173.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.173.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.174.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.174.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.175.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.175.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.176.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.176.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.177.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.177.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.177.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.177.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.178.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.178.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.179.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.179.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.180.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.180.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.180.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.180.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.181.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.181.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.182.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.182.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.183.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.183.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.184.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.184.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.184.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.184.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.185.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.185.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.186.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.186.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.187.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.187.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.187.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.187.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.188.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.188.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.189.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.189.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.190.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.190.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.191.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.191.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.191.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.191.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.192.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.192.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.193.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.193.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.194.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.194.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.194.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.194.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.195.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.195.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.196.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.196.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.197.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.197.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.198.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.198.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.198.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.198.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.199.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.199.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.200.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.200.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.201.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.201.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.201.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.201.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.202.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.202.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.203.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.203.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.204.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.204.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.205.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.205.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.205.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.205.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.206.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.206.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.207.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.207.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.208.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.208.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.208.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.208.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.209.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.209.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.210.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.210.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.211.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.211.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.212.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.212.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.212.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.212.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.213.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.213.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.214.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.214.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.215.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.215.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.215.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.215.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.216.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.216.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.217.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.217.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.218.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.218.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.219.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.219.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.219.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.219.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.220.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.220.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.221.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.221.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.222.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.222.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.222.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.222.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.223.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.223.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.224.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.224.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.225.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.225.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.226.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.226.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.226.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.226.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.227.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.227.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.228.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.228.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.229.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.229.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.229.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.229.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.230.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.230.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.231.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.231.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.232.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.232.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.233.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.233.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.233.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.233.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.234.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.234.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.235.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.235.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.236.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.236.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.236.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.236.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.237.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.237.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.238.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.238.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.239.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.239.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.240.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.240.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.240.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.240.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.241.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.241.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.242.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.242.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.243.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.243.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.243.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.243.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.244.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.244.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.245.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.245.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.246.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.246.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", 
"model.layers.17.mlp.experts.247.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.247.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.247.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.247.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.248.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.248.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.249.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.249.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.250.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.up_proj.weight": "model-00042-of-000163.safetensors", - 
"model.layers.17.mlp.experts.250.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.250.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.250.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.251.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.251.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.gate_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.up_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.up_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.252.down_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.252.down_proj.weight_scale_inv": "model-00042-of-000163.safetensors", "model.layers.17.mlp.experts.253.gate_proj.weight": "model-00042-of-000163.safetensors", - "model.layers.17.mlp.experts.253.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.253.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.253.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.253.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.253.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.17.mlp.experts.254.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.254.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.254.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.254.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.mlp.experts.255.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.17.mlp.experts.255.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.17.input_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.17.post_attention_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_a_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.q_a_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_a_layernorm.weight": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.q_b_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.q_b_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_a_proj_with_mqa.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_a_layernorm.weight": 
"model-00043-of-000163.safetensors", "model.layers.18.self_attn.kv_b_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.kv_b_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.self_attn.o_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.self_attn.o_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.gate.weight": "model-00043-of-000163.safetensors", "model.layers.18.mlp.gate.e_score_correction_bias": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.shared_experts.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.shared_experts.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.0.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.0.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.1.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.up_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.1.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.1.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.1.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.2.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.2.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.3.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.3.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.4.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.4.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.gate_proj.weight": 
"model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.5.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.5.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.6.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.6.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.7.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.7.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.8.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.8.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.8.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.8.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.9.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.9.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.10.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.10.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.11.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.11.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.12.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.12.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.12.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.12.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.13.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.13.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.14.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.14.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.15.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.15.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.15.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.15.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.16.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.16.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.17.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.17.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.18.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.18.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.19.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.19.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.19.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.19.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.20.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.20.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.21.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.21.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.22.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.22.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.22.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.22.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.23.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.23.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.24.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.24.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.25.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.25.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.26.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.26.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.26.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.26.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.27.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.27.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.28.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.28.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.29.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.29.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.29.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.29.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.30.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.30.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.31.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.31.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.32.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.32.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.33.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.33.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.33.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.33.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.34.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.34.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.35.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.35.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.36.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.36.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.36.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.36.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.37.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.37.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.38.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.38.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.39.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.39.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.40.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.40.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.40.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.40.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.41.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.41.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.42.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.42.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.43.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.43.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.43.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.43.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.44.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.44.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.45.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.45.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.46.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.46.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.47.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.47.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.47.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.47.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.48.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.48.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.49.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.49.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.50.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.50.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.50.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.50.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.51.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.51.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.52.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.52.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.53.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.53.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.54.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.54.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.54.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.54.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.55.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.55.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.56.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.56.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.57.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.57.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.57.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.57.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.58.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.58.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.59.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.59.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.60.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.60.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.61.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.61.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.61.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.61.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.62.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.62.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.63.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.63.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.64.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.64.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.64.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.64.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.65.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.65.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.66.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.66.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.67.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.67.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.68.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.68.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.68.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.68.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.69.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.69.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.70.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.70.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.71.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.71.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.71.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.71.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.72.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.72.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.73.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.73.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.74.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.74.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.75.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.75.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.75.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.75.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.76.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.76.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.77.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.77.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.78.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.78.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.78.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.78.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.79.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.79.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.80.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.80.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.81.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.81.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.82.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.82.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.82.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.82.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.83.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.83.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.84.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.84.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.85.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.85.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", 
"model.layers.18.mlp.experts.85.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.85.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.86.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.86.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.87.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.87.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.gate_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.up_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.88.down_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.88.down_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.89.gate_proj.weight": "model-00043-of-000163.safetensors", - 
"model.layers.18.mlp.experts.89.gate_proj.weight_scale_inv": "model-00043-of-000163.safetensors", "model.layers.18.mlp.experts.89.up_proj.weight": "model-00043-of-000163.safetensors", - "model.layers.18.mlp.experts.89.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.89.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.89.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.90.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.90.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.91.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.91.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.92.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.92.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.92.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.92.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.93.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.93.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.94.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.94.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.95.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.95.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.96.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.96.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.96.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.96.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.97.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.97.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.98.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.98.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.99.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.99.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.99.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.99.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.100.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.100.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.101.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.101.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.102.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.102.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.103.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.103.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.103.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.103.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.104.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.104.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.105.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.105.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.106.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.106.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.106.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.106.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.107.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.107.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.108.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.108.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.109.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.109.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.110.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.110.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.110.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.110.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.111.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.111.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.112.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.112.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.113.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.113.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.113.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.113.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.114.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.114.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.115.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.115.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.116.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.116.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.117.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.117.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.117.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.117.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.118.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.118.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.119.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.119.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.120.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.120.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.120.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.120.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.121.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.121.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.122.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.122.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.123.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.123.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.124.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.124.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.124.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.124.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.125.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.125.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.126.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.126.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.127.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.127.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.127.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.127.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.128.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.128.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.129.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.129.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.130.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.130.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.131.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.131.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.131.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.131.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.132.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.132.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.133.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.133.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.134.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.134.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.134.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.134.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.135.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.135.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.136.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.136.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.137.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.137.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.138.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.138.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.138.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.138.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.139.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.139.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.140.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.140.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.141.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.141.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.141.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.141.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.142.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.142.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.143.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.143.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.144.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.144.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.145.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.145.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.145.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.145.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.146.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.146.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.147.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.147.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.148.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.148.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.148.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.148.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.149.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.149.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.150.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.150.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.151.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.151.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.152.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.152.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.152.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.152.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.153.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.153.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.154.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.154.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.155.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.155.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.155.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.155.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.156.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.156.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.157.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.157.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.158.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.158.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.159.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.159.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.159.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.159.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.160.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.160.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.161.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.161.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.162.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.162.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.162.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.162.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.163.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.163.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.164.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.164.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.165.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.165.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.166.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.166.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.166.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.166.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.167.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.167.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.168.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.168.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.169.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.169.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.169.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.169.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.170.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.170.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.171.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.171.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.172.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.172.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.173.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.173.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.173.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.173.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.174.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.174.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.175.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.175.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.176.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.176.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.176.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.176.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.177.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.177.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.178.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.178.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.179.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.179.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.180.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.180.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.180.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.180.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.181.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.181.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.182.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.182.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.183.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.183.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", 
"model.layers.18.mlp.experts.183.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.183.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.184.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.184.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.185.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.185.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.gate_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.gate_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.up_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.up_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.186.down_proj.weight": "model-00044-of-000163.safetensors", - "model.layers.18.mlp.experts.186.down_proj.weight_scale_inv": "model-00044-of-000163.safetensors", "model.layers.18.mlp.experts.187.gate_proj.weight": "model-00044-of-000163.safetensors", - 
"model.layers.18.mlp.experts.187.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.187.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.187.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.187.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.187.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.188.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.188.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.189.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.189.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.190.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.190.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.190.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.190.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.191.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.191.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.192.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.192.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.193.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.193.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.194.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.194.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.194.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.194.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.195.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.195.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.196.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.196.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.197.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.197.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.197.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.197.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.198.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.198.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.199.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.199.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.200.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.200.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.201.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.201.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.201.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.201.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.202.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.202.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.203.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.203.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.204.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.204.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.204.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.204.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.205.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.205.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.206.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.206.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.207.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.207.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.208.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.208.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.208.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.208.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.209.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.209.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.210.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.210.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.211.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.211.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.211.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.211.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.212.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.212.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.213.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.213.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.214.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.214.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.215.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.215.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.215.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.215.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.216.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.216.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.217.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.217.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.218.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.218.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.218.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.218.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.219.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.219.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.220.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.220.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.221.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.221.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.222.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.222.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.222.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.222.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.223.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.223.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.224.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.224.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.225.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.225.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.225.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.225.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.226.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.226.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.227.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.227.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.228.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.228.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.229.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.229.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.229.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.229.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.230.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.230.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.231.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.231.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.232.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.232.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.232.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.232.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.233.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.233.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.234.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.234.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.235.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.235.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.236.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.236.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.236.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.236.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.237.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.237.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.238.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.238.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.239.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.239.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.239.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.239.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.240.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.240.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.241.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.241.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.242.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.242.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.243.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.243.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.243.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.243.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.244.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.244.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.245.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.245.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.246.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.246.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.246.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.246.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.247.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.247.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.248.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.248.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.249.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.249.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.18.mlp.experts.250.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.250.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.250.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.250.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.251.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.251.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.252.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.252.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.253.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.253.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.18.mlp.experts.253.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.253.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.254.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.254.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.mlp.experts.255.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.18.mlp.experts.255.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.18.input_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.18.post_attention_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_a_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.q_a_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_a_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.q_b_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.q_b_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_a_proj_with_mqa.weight": 
"model-00045-of-000163.safetensors", - "model.layers.19.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_a_layernorm.weight": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.kv_b_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.kv_b_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.self_attn.o_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.self_attn.o_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.gate.weight": "model-00045-of-000163.safetensors", "model.layers.19.mlp.gate.e_score_correction_bias": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.shared_experts.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.shared_experts.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.0.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.0.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.gate_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.19.mlp.experts.1.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.1.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.1.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.1.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.2.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.2.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.3.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.3.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.4.down_proj.weight": 
"model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.4.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.5.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.5.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.6.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.6.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.7.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.7.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.8.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.19.mlp.experts.8.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.8.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.8.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.9.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.9.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.10.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.10.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.11.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.11.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.11.down_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.19.mlp.experts.11.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.12.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.12.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.13.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.13.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.14.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.14.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.15.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.19.mlp.experts.15.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.15.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.15.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.16.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.16.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.17.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.17.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.18.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.18.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.18.down_proj.weight": "model-00045-of-000163.safetensors", - 
"model.layers.19.mlp.experts.18.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.19.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.19.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.20.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.20.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.21.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.21.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.22.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", 
"model.layers.19.mlp.experts.22.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.up_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.22.down_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.22.down_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.23.gate_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.23.gate_proj.weight_scale_inv": "model-00045-of-000163.safetensors", "model.layers.19.mlp.experts.23.up_proj.weight": "model-00045-of-000163.safetensors", - "model.layers.19.mlp.experts.23.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.23.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.23.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.24.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.24.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.25.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.25.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.25.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.25.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.26.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.26.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.27.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.27.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.28.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.28.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.29.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.29.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.29.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.29.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.30.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.30.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.31.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.31.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.32.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.32.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.32.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.32.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.33.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.33.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.34.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.34.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.35.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.35.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.36.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.36.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.36.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.36.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.37.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.37.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.38.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.38.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.39.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.39.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.39.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.39.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.40.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.40.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.41.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.41.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.42.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.42.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.43.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.43.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.43.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.43.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.44.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.44.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.45.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.45.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.46.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.46.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.46.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.46.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.47.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.47.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.48.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.48.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.49.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.49.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.50.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.50.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.50.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.50.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.51.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.51.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.52.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.52.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.53.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.53.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.53.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.53.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.54.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.54.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.55.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.55.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.56.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.56.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.57.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.57.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.57.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.57.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.58.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.58.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.59.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.59.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.60.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.60.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.60.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.60.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.61.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.61.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.62.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.62.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.63.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.63.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.64.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.64.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.64.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.64.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.65.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.65.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.66.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.66.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.67.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.67.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.67.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.67.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.68.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.68.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.69.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.69.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.70.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.70.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.71.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.71.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.71.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.71.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.72.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.72.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.73.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.73.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.74.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.74.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.74.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.74.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.75.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.75.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.76.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.76.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.77.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.77.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.78.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.78.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.78.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.78.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.79.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.79.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.80.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.80.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.81.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.81.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.81.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.81.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.82.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.82.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.83.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.83.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.84.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.84.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.85.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.85.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.85.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.85.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.86.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.86.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.87.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.87.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.88.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.88.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.88.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.88.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.89.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.89.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.90.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.90.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.91.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.91.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.92.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.92.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.92.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.92.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.93.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.93.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.94.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.94.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.95.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.95.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.95.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.95.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.96.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.96.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.97.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.97.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.98.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.98.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.99.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.99.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.99.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.99.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.100.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.100.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.101.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.101.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.102.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.102.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.102.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.102.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.103.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.103.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.104.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.104.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.105.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.105.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.106.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.106.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.106.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.106.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.107.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.107.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.108.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.108.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.109.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.109.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.109.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.109.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.110.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.110.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.111.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.111.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.112.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.112.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.113.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.113.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.113.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.113.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.114.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.114.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.115.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.115.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.116.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.116.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.116.down_proj.weight": "model-00046-of-000163.safetensors", - 
"model.layers.19.mlp.experts.116.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.117.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.117.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.118.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.118.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.119.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.119.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.120.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.gate_proj.weight_scale_inv": "model-00046-of-000163.safetensors", 
"model.layers.19.mlp.experts.120.up_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.up_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.120.down_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.120.down_proj.weight_scale_inv": "model-00046-of-000163.safetensors", "model.layers.19.mlp.experts.121.gate_proj.weight": "model-00046-of-000163.safetensors", - "model.layers.19.mlp.experts.121.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.121.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.121.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.121.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.121.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.122.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.122.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.123.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.123.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.123.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.123.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.124.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.124.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.125.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.125.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.126.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.126.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.127.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.127.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.127.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.127.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.128.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.128.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.129.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.129.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.130.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.130.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.130.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.130.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.131.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.131.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.132.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.132.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.133.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.133.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.134.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.134.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.134.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.134.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.135.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.135.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.136.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.136.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.137.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.137.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.137.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.137.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.138.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.138.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.139.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.139.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.140.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.140.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.141.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.141.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.141.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.141.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.142.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.142.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.143.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.143.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.144.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.144.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.144.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.144.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.145.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.145.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.146.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.146.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.147.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.147.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.148.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.148.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.148.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.148.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.149.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.149.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.150.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.150.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.151.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.151.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.151.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.151.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.152.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.152.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.153.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.153.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.154.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.154.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.155.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.155.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.155.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.155.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.156.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.156.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.157.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.157.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.158.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.158.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.158.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.158.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.159.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.159.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.160.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.160.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.161.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.161.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.162.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.162.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.162.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.162.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.163.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.163.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.164.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.164.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.165.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.165.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.165.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.165.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.166.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.166.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.167.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.167.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.168.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.168.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.169.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.169.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.169.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.169.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.170.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.170.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.171.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.171.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.172.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.172.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.172.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.172.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.173.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.173.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.174.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.174.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.175.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.175.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.176.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.176.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.176.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.176.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.177.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.177.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.178.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.178.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.179.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.179.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.179.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.179.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.180.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.180.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.181.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.181.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.182.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.182.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.183.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.183.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.183.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.183.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.184.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.184.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.185.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.185.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.186.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.186.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.186.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.186.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.187.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.187.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.188.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.188.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.189.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.189.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.190.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.190.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.190.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.190.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.191.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.191.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.192.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.192.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.193.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.193.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.193.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.193.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.194.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.194.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.195.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.195.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.196.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.196.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.197.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.197.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.197.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.197.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.198.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.198.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.199.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.199.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.200.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.200.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.200.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.200.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.201.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.201.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.202.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.202.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.203.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.203.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.204.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.204.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.204.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.204.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.205.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.205.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.206.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.206.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.207.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.207.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.207.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.207.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.208.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.208.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.209.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.209.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.210.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.210.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.211.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.211.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.211.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.211.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.212.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.212.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.213.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.213.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.214.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.214.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.214.down_proj.weight": "model-00047-of-000163.safetensors", - 
"model.layers.19.mlp.experts.214.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.215.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.215.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.216.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.216.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.217.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.217.down_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.218.gate_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.gate_proj.weight_scale_inv": "model-00047-of-000163.safetensors", 
"model.layers.19.mlp.experts.218.up_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.up_proj.weight_scale_inv": "model-00047-of-000163.safetensors", "model.layers.19.mlp.experts.218.down_proj.weight": "model-00047-of-000163.safetensors", - "model.layers.19.mlp.experts.218.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.219.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.219.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.220.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.220.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.221.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.221.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.221.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.19.mlp.experts.221.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.222.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.222.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.223.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.223.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.224.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.224.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.225.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.19.mlp.experts.225.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.225.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.225.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.226.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.226.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.227.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.227.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.228.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.228.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.228.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.19.mlp.experts.228.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.229.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.229.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.230.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.230.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.231.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.231.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.232.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.19.mlp.experts.232.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.232.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.232.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.233.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.233.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.234.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.234.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.235.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.235.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.235.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.19.mlp.experts.235.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.236.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.236.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.237.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.237.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.238.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.238.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.239.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.19.mlp.experts.239.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.239.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.239.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.240.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.240.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.241.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.241.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.242.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.242.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.242.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.19.mlp.experts.242.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.243.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.243.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.244.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.244.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.245.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.245.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.246.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.19.mlp.experts.246.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.246.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.246.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.247.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.247.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.248.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.248.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.249.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.249.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.249.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.19.mlp.experts.249.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.250.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.250.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.251.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.251.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.252.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.252.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.253.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.19.mlp.experts.253.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.253.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.253.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.254.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.254.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.mlp.experts.255.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.19.mlp.experts.255.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.19.input_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.19.post_attention_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_a_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.q_a_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_a_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.q_b_proj.weight": 
"model-00048-of-000163.safetensors", - "model.layers.20.self_attn.q_b_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_a_proj_with_mqa.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_a_layernorm.weight": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.kv_b_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.kv_b_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.self_attn.o_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.self_attn.o_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.gate.weight": "model-00048-of-000163.safetensors", "model.layers.20.mlp.gate.e_score_correction_bias": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.shared_experts.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.shared_experts.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.0.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.0.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.0.down_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.0.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.1.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.1.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.2.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.2.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.3.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.3.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.up_proj.weight": 
"model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.4.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.4.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.5.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.5.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.6.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.6.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.7.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.7.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.8.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.8.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.8.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.8.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.9.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.9.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.10.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.10.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.11.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.11.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.11.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.11.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.12.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.12.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.13.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.13.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.14.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.14.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.15.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.15.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.15.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.15.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.16.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.16.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.17.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.17.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.18.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.18.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.18.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.18.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.19.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.19.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.20.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.20.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.21.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.21.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.22.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.22.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.22.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.22.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.23.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.23.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.24.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.24.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.25.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.25.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.25.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.25.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.26.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.26.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.27.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.27.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.28.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.28.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.29.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.29.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.29.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.29.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.30.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.30.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.31.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.31.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.32.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.32.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.32.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.32.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.33.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.33.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.34.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.34.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.35.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.35.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.36.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.36.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.36.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.36.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.37.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.37.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.38.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.38.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.39.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.39.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.39.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.39.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.40.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.40.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.41.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.41.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.42.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.42.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.43.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.43.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.43.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.43.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.44.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.44.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.45.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.45.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.46.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.46.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.46.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.46.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.47.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.47.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.48.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.48.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.49.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.49.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", 
"model.layers.20.mlp.experts.50.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.50.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.50.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.50.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.51.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.51.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.52.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.52.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.53.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.up_proj.weight": "model-00048-of-000163.safetensors", - 
"model.layers.20.mlp.experts.53.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.53.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.53.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.gate_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.up_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.up_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.54.down_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.54.down_proj.weight_scale_inv": "model-00048-of-000163.safetensors", "model.layers.20.mlp.experts.55.gate_proj.weight": "model-00048-of-000163.safetensors", - "model.layers.20.mlp.experts.55.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.55.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.55.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.55.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.55.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.56.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.56.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.57.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.57.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.57.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.57.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.58.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.58.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.59.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.59.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.60.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.60.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.60.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.60.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.61.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.61.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.62.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.62.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.63.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.63.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.64.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.64.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.64.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.64.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.65.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.65.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.66.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.66.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.67.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.67.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.67.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.67.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.68.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.68.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.69.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.69.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.70.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.70.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.71.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.71.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.71.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.71.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.72.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.72.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.73.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.73.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.74.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.74.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.74.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.74.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.75.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.75.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.76.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.76.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.77.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.77.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.78.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.78.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.78.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.78.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.79.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.79.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.80.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.80.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.81.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.81.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.81.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.81.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.82.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.82.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.83.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.83.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.84.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.84.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.85.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.85.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.85.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.85.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.86.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.86.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.87.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.87.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.88.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.88.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.88.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.88.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.89.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.89.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.90.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.90.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.91.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.91.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.92.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.92.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.92.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.92.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.93.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.93.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.94.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.94.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.95.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.95.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.95.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.95.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.96.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.96.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.97.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.97.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.98.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.98.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.99.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.99.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.99.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.99.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.100.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.100.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.101.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.101.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.102.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.102.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.102.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.102.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.103.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.103.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.104.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.104.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.105.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.105.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.106.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.106.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.106.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.106.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.107.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.107.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.108.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.108.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.109.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.109.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.109.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.109.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.110.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.110.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.111.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.111.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.112.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.112.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.113.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.113.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.113.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.113.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.114.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.114.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.115.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.115.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.116.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.116.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.116.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.116.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.117.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.117.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.118.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.118.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.119.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.119.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.120.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.120.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.120.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.120.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.121.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.121.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.122.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.122.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.123.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.123.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.123.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.123.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.124.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.124.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.125.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.125.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.126.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.126.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.127.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.127.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.127.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.127.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.128.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.128.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.129.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.129.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.130.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.130.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.130.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.130.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.131.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.131.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.132.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.132.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.133.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.133.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.134.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.134.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.134.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.134.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.135.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.135.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.136.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.136.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.137.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.137.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.137.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.137.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.138.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.138.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.139.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.139.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.140.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.140.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.141.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.141.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.141.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.141.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.142.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.142.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.143.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.143.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.144.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.144.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.144.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.144.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.145.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.145.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.146.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.146.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.147.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.147.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", 
"model.layers.20.mlp.experts.148.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.148.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.148.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.148.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.149.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.149.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.150.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.150.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.151.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.up_proj.weight": "model-00049-of-000163.safetensors", - 
"model.layers.20.mlp.experts.151.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.151.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.151.down_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.gate_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.gate_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.up_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.up_proj.weight_scale_inv": "model-00049-of-000163.safetensors", "model.layers.20.mlp.experts.152.down_proj.weight": "model-00049-of-000163.safetensors", - "model.layers.20.mlp.experts.152.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.153.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.153.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.154.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.154.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.155.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.155.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.155.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.155.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.156.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.156.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.157.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.157.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.158.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.158.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.158.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.158.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.159.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.159.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.160.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.160.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.161.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.161.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.162.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.162.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.162.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.162.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.163.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.163.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.164.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.164.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.165.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.165.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.165.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.165.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.166.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.166.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.167.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.167.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.168.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.168.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.169.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.169.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.169.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.169.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.170.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.170.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.171.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.171.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.172.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.172.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.172.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.172.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.173.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.173.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.174.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.174.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.175.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.175.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.176.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.176.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.176.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.176.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.177.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.177.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.178.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.178.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.179.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.179.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.179.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.179.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.180.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.180.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.181.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.181.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.182.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.182.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.183.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.183.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.183.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.183.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.184.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.184.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.185.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.185.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.186.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.186.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.186.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.186.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.187.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.187.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.188.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.188.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.189.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.189.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.190.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.190.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.190.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.190.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.191.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.191.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.192.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.192.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.193.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.193.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.193.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.193.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.194.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.194.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.195.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.195.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.196.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.196.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.197.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.197.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.197.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.197.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.198.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.198.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.199.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.199.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.200.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.200.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.200.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.200.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.201.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.201.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.202.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.202.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.203.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.203.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.204.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.204.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.204.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.204.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.205.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.205.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.206.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.206.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.207.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.207.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.207.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.207.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.208.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.208.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.209.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.209.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.210.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.210.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.211.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.211.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.211.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.211.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.212.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.212.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.213.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.213.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.214.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.214.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.214.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.214.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.215.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.215.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.216.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.216.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.217.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.217.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.218.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.218.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.218.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.218.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.219.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.219.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.220.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.220.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.221.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.221.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.221.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.221.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.222.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.222.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.223.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.223.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.224.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.224.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.225.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.225.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.225.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.225.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.226.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.226.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.227.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.227.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.228.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.228.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.228.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.228.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.229.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.229.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.230.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.230.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.231.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.231.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.232.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.232.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.232.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.232.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.233.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.233.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.234.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.234.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.235.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.235.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.235.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.235.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.236.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.236.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.237.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.237.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.238.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.238.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.239.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.239.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.239.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.239.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.240.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.240.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.241.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.241.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.242.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.242.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.242.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.242.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.243.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.243.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.244.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.244.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.245.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.245.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", 
"model.layers.20.mlp.experts.246.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.246.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.246.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.246.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.247.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.247.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.248.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.248.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.249.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.up_proj.weight": "model-00050-of-000163.safetensors", - 
"model.layers.20.mlp.experts.249.up_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.249.down_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.249.down_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.250.gate_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.250.gate_proj.weight_scale_inv": "model-00050-of-000163.safetensors", "model.layers.20.mlp.experts.250.up_proj.weight": "model-00050-of-000163.safetensors", - "model.layers.20.mlp.experts.250.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.250.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.250.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.251.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.251.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.252.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.252.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.20.mlp.experts.253.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.253.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.253.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.253.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.254.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.254.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.mlp.experts.255.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.20.mlp.experts.255.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.20.input_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.20.post_attention_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_a_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.self_attn.q_a_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_a_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.q_b_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.q_b_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_a_proj_with_mqa.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_a_layernorm.weight": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.kv_b_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.kv_b_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.self_attn.o_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.self_attn.o_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.gate.weight": "model-00051-of-000163.safetensors", "model.layers.21.mlp.gate.e_score_correction_bias": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.shared_experts.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.shared_experts.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.up_proj.weight": 
"model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.0.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.0.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.1.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.1.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.2.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.2.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.3.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.3.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.4.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.4.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.4.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.4.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.5.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.5.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.6.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.6.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.up_proj.weight_scale_inv": 
"model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.7.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.7.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.8.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.8.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.9.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.9.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.10.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.10.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.11.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.11.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.11.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.11.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.12.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.12.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.13.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.13.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.14.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.14.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.14.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.14.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.15.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.15.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.16.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.16.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.17.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.17.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.18.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.18.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.18.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.18.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.19.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.19.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.20.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.20.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.21.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.21.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.21.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.21.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.22.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.22.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.23.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.23.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.24.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.24.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.25.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.25.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.25.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.25.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.26.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.26.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.27.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.27.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.28.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.28.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.28.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.28.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.29.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.29.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.30.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.30.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.31.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.31.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.32.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.32.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.32.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.32.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.33.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.33.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.34.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.34.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.35.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.35.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.35.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.35.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.36.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.36.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.37.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.37.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.38.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.38.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.39.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.39.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.39.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.39.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.40.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.40.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.41.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.41.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.42.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.42.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.42.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.42.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.43.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.43.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.44.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.44.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.45.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.45.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.46.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.46.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.46.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.46.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.47.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.47.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.48.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.48.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.49.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.49.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.49.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.49.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.50.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.50.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.51.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.51.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.52.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.52.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.53.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.53.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.53.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.53.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.54.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.54.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.55.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.55.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.56.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.56.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.56.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.56.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.57.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.57.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.58.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.58.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.59.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.59.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.60.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.60.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.60.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.60.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.61.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.61.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.62.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.62.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.63.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.63.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.63.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.63.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.64.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.64.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.65.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.65.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.66.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.66.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.67.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.67.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.67.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.67.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.68.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.68.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.69.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.69.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.70.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.70.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.70.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.70.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.71.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.71.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.72.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.72.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.73.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.73.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.74.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.74.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.74.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.74.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.75.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.75.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.76.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.76.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.77.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.77.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.77.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.77.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.78.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.78.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.79.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.79.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.80.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.80.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.gate_proj.weight": "model-00051-of-000163.safetensors", - 
"model.layers.21.mlp.experts.81.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.81.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.81.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.81.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.82.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.82.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.83.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.83.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.84.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.84.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", 
"model.layers.21.mlp.experts.84.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.84.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.85.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.85.down_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.gate_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.gate_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.up_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.up_proj.weight_scale_inv": "model-00051-of-000163.safetensors", "model.layers.21.mlp.experts.86.down_proj.weight": "model-00051-of-000163.safetensors", - "model.layers.21.mlp.experts.86.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.87.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.87.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.88.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.88.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.88.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.88.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.89.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.89.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.90.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.90.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.91.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.91.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.91.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.91.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.92.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.92.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.93.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.93.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.94.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.94.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.95.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.95.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.95.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.95.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.96.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.96.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.97.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.97.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.98.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.98.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.98.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.98.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.99.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.99.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.100.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.100.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.101.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.101.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.102.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.102.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.102.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.102.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.103.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.103.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.104.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.104.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.105.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.105.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.105.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.105.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.106.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.106.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.107.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.107.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.108.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.108.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.109.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.109.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.109.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.109.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.110.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.110.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.111.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.111.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.112.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.112.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.112.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.112.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.113.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.113.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.114.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.114.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.115.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.115.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.116.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.116.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.116.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.116.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.117.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.117.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.118.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.118.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.119.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.119.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.119.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.119.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.120.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.120.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.121.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.121.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.122.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.122.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.123.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.123.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.123.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.123.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.124.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.124.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.125.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.125.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.126.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.126.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.126.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.126.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.127.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.127.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.128.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.128.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.129.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.129.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.130.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.130.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.130.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.130.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.131.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.131.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.132.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.132.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.133.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.133.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.133.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.133.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.134.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.134.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.135.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.135.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.136.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.136.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.137.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.137.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.137.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.137.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.138.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.138.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.139.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.139.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.140.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.140.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.140.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.140.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.141.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.141.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.142.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.142.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.143.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.143.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.144.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.144.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.144.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.144.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.145.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.145.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.146.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.146.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.147.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.147.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.147.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.147.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.148.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.148.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.149.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.149.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.150.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.150.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.151.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.151.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.151.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.151.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.152.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.152.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.153.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.153.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.154.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.154.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.154.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.154.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.155.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.155.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.156.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.156.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.157.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.157.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.158.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.158.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.158.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.158.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.159.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.159.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.160.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.160.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.161.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.161.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.161.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.161.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.162.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.162.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.163.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.163.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.164.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.164.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.165.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.165.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.165.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.165.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.166.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.166.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.167.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.167.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.168.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.168.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.168.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.168.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.169.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.169.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.170.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.170.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.171.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.171.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.172.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.172.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.172.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.172.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.173.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.173.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.174.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.174.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.175.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.175.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.175.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.175.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.176.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.176.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.177.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.177.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.178.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.178.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.gate_proj.weight": "model-00052-of-000163.safetensors", - 
"model.layers.21.mlp.experts.179.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.179.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.179.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.179.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.180.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.180.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.181.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.181.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.182.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.182.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", 
"model.layers.21.mlp.experts.182.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.182.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.up_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.183.down_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.183.down_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.184.gate_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.184.gate_proj.weight_scale_inv": "model-00052-of-000163.safetensors", "model.layers.21.mlp.experts.184.up_proj.weight": "model-00052-of-000163.safetensors", - "model.layers.21.mlp.experts.184.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.184.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.184.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.185.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.185.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.186.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.186.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.186.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.186.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.187.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.187.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.188.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.188.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.189.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.189.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.189.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.189.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.190.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.190.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.191.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.191.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.192.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.192.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.193.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.193.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.193.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.193.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.194.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.194.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.195.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.195.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.196.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.196.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.196.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.196.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.197.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.197.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.198.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.198.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.199.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.199.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.200.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.200.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.200.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.200.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.201.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.201.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.202.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.202.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.203.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.203.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.203.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.203.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.204.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.204.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.205.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.205.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.206.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.206.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.207.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.207.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.207.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.207.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.208.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.208.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.209.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.209.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.210.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.210.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.210.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.210.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.211.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.211.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.212.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.212.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.213.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.213.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.214.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.214.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.214.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.214.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.215.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.215.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.216.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.216.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.217.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.217.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.217.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.217.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.218.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.218.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.219.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.219.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.220.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.220.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.221.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.221.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.221.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.221.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.222.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.222.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.223.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.223.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.224.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.224.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.224.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.224.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.225.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.225.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.226.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.226.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.227.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.227.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.228.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.228.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.228.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.228.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.229.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.229.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.230.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.230.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.231.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.231.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.231.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.231.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.232.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.232.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.233.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.233.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.234.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.234.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.235.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.235.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.235.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.235.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.236.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.236.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.237.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.237.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.238.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.238.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.238.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.238.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.239.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.239.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.240.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.240.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.241.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.241.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.242.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.242.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.242.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.242.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.243.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.243.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.244.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.244.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.245.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.245.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.245.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.245.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.246.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.246.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.247.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.247.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.248.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.248.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.21.mlp.experts.249.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.249.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.249.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.249.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.250.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.250.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.251.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.251.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.252.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.252.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.21.mlp.experts.252.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.252.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.253.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.253.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.254.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.254.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.mlp.experts.255.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.21.mlp.experts.255.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.21.input_layernorm.weight": "model-00053-of-000163.safetensors", 
"model.layers.21.post_attention_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_a_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.q_a_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_a_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.q_b_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.q_b_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_a_proj_with_mqa.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_a_layernorm.weight": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.kv_b_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.kv_b_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.self_attn.o_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.self_attn.o_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.gate.weight": "model-00053-of-000163.safetensors", "model.layers.22.mlp.gate.e_score_correction_bias": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.shared_experts.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.shared_experts.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.gate_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.22.mlp.experts.0.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.0.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.0.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.0.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.1.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.1.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.2.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.2.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.3.down_proj.weight": 
"model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.3.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.4.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.4.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.5.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.5.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.6.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.6.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.7.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.22.mlp.experts.7.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.7.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.7.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.8.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.8.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.9.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.9.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.10.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.11.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.11.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.12.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.12.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.13.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.13.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.14.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.up_proj.weight": "model-00053-of-000163.safetensors", - 
"model.layers.22.mlp.experts.14.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.14.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.14.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.15.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.15.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.16.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.16.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.17.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.17.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", 
"model.layers.22.mlp.experts.18.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.18.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.18.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.18.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.19.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.19.down_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.gate_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.gate_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.up_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.up_proj.weight_scale_inv": "model-00053-of-000163.safetensors", "model.layers.22.mlp.experts.20.down_proj.weight": "model-00053-of-000163.safetensors", - "model.layers.22.mlp.experts.20.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.21.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.21.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.21.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.21.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.22.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.22.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.23.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.23.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.24.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.24.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.25.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.25.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.25.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.25.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.26.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.26.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.27.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.27.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.28.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.28.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.28.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.28.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.29.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.29.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.30.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.30.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.31.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.31.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.32.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.32.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.32.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.32.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.33.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.33.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.34.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.34.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.35.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.35.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.35.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.35.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.36.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.36.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.37.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.37.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.38.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.38.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.39.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.39.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.39.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.39.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.40.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.40.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.41.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.41.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.42.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.42.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.42.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.42.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.43.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.43.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.44.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.44.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.45.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.45.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.46.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.46.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.46.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.46.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.47.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.47.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.48.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.48.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.49.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.49.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.49.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.49.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.50.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.50.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.51.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.51.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.52.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.52.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.53.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.53.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.53.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.53.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.54.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.54.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.55.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.55.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.56.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.56.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.56.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.56.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.57.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.57.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.58.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.58.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.59.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.59.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.60.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.60.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.60.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.60.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.61.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.61.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.62.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.62.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.63.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.63.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.63.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.63.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.64.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.64.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.65.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.65.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.66.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.66.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.67.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.67.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.67.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.67.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.68.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.68.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.69.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.69.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.70.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.70.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.70.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.70.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.71.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.71.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.72.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.72.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.73.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.73.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.74.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.74.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.74.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.74.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.75.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.75.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.76.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.76.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.77.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.77.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.77.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.77.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.78.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.78.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.79.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.79.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.80.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.80.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.81.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.81.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.81.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.81.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.82.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.82.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.83.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.83.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.84.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.84.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.84.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.84.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.85.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.85.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.86.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.86.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.87.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.87.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.88.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.88.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.88.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.88.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.89.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.89.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.90.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.90.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.91.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.91.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.91.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.91.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.92.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.92.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.93.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.93.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.94.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.94.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.95.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.95.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.95.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.95.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.96.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.96.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.97.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.97.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.98.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.98.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.98.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.98.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.99.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.99.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.100.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.100.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.101.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.101.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.102.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.102.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.102.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.102.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.103.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.103.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.104.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.104.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.105.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.105.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.105.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.105.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.106.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.106.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.107.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.107.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.108.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.108.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.109.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.109.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.109.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.109.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.110.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.110.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.111.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.111.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.112.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.up_proj.weight": "model-00054-of-000163.safetensors", - 
"model.layers.22.mlp.experts.112.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.112.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.112.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.113.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.113.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.114.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.114.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.115.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.115.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", 
"model.layers.22.mlp.experts.116.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.116.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.116.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.116.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.up_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.117.down_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.117.down_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.118.gate_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.118.gate_proj.weight_scale_inv": "model-00054-of-000163.safetensors", "model.layers.22.mlp.experts.118.up_proj.weight": "model-00054-of-000163.safetensors", - "model.layers.22.mlp.experts.118.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.118.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.118.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.119.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.119.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.119.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.119.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.120.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.120.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.121.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.121.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.122.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.122.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.123.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.123.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.123.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.123.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.124.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.124.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.125.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.125.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.126.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.126.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.126.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.126.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.127.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.127.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.128.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.128.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.129.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.129.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.130.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.130.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.130.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.130.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.131.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.131.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.132.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.132.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.133.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.133.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.133.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.133.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.134.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.134.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.135.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.135.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.136.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.136.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.137.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.137.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.137.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.137.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.138.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.138.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.139.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.139.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.140.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.140.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.140.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.140.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.141.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.141.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.142.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.142.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.143.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.143.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.144.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.144.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.144.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.144.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.145.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.145.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.146.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.146.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.147.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.147.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.147.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.147.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.148.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.148.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.149.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.149.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.150.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.150.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.151.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.151.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.151.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.151.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.152.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.152.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.153.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.153.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.154.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.154.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.154.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.154.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.155.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.155.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.156.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.156.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.157.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.157.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.158.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.158.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.158.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.158.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.159.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.159.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.160.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.160.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.161.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.161.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.161.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.161.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.162.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.162.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.163.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.163.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.164.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.164.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.165.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.165.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.165.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.165.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.166.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.166.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.167.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.167.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.168.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.168.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.168.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.168.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.169.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.169.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.170.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.170.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.171.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.171.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.172.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.172.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.172.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.172.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.173.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.173.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.174.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.174.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.175.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.175.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.175.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.175.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.176.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.176.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.177.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.177.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.178.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.178.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.179.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.179.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.179.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.179.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.180.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.180.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.181.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.181.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.182.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.182.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.182.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.182.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.183.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.183.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.184.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.184.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.185.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.185.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.186.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.186.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.186.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.186.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.187.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.187.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.188.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.188.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.189.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.189.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.189.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.189.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.190.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.190.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.191.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.191.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.192.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.192.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.193.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.193.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.193.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.193.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.194.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.194.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.195.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.195.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.196.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.196.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.196.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.196.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.197.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.197.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.198.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.198.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.199.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.199.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.200.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.200.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.200.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.200.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.201.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.201.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.202.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.202.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.203.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.203.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.203.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.203.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.204.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.204.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.205.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.205.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.206.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.206.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.207.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.207.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.207.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.207.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.208.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.208.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.209.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.209.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.210.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.up_proj.weight": "model-00055-of-000163.safetensors", - 
"model.layers.22.mlp.experts.210.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.210.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.210.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.211.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.211.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.212.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.212.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.213.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.213.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", 
"model.layers.22.mlp.experts.214.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.214.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.214.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.214.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.gate_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.up_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.up_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.215.down_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.215.down_proj.weight_scale_inv": "model-00055-of-000163.safetensors", "model.layers.22.mlp.experts.216.gate_proj.weight": "model-00055-of-000163.safetensors", - "model.layers.22.mlp.experts.216.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.216.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.216.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.216.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.216.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.217.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.217.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.217.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.217.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.218.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.218.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.219.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.219.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.220.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.220.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.mlp.experts.221.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.221.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.221.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.221.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.222.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.222.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.223.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.223.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.224.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.224.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.224.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.224.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.225.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.225.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.226.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.226.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.227.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.227.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.mlp.experts.228.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.228.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.228.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.228.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.229.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.229.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.230.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.230.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.231.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.231.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.231.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.231.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.232.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.232.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.233.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.233.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.234.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.234.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.mlp.experts.235.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.235.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.235.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.235.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.236.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.236.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.237.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.237.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.238.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.238.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.238.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.238.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.239.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.239.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.240.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.240.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.241.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.241.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.mlp.experts.242.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.242.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.242.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.242.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.243.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.243.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.244.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.244.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.245.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.245.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.245.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.245.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.246.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.246.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.247.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.247.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.248.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.248.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.mlp.experts.249.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.249.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.249.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.249.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.250.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.250.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.251.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.251.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.252.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.up_proj.weight": "model-00056-of-000163.safetensors", - 
"model.layers.22.mlp.experts.252.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.252.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.252.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.253.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.253.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.254.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.254.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.gate_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.gate_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.up_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.up_proj.weight_scale_inv": "model-00056-of-000163.safetensors", "model.layers.22.mlp.experts.255.down_proj.weight": "model-00056-of-000163.safetensors", - "model.layers.22.mlp.experts.255.down_proj.weight_scale_inv": "model-00056-of-000163.safetensors", 
"model.layers.22.input_layernorm.weight": "model-00056-of-000163.safetensors", "model.layers.22.post_attention_layernorm.weight": "model-00056-of-000163.safetensors", "model.layers.23.self_attn.q_a_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.q_a_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.q_a_layernorm.weight": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.q_b_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.q_b_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_a_proj_with_mqa.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_a_layernorm.weight": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.kv_b_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.kv_b_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.self_attn.o_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.self_attn.o_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.gate.weight": "model-00057-of-000163.safetensors", "model.layers.23.mlp.gate.e_score_correction_bias": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.shared_experts.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.shared_experts.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.0.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.0.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.0.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.0.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.1.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.1.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.2.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.2.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.3.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.3.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.4.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.4.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.5.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.5.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.6.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.6.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.gate_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.7.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.7.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.7.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.7.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.8.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.8.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.9.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.9.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.10.down_proj.weight": 
"model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.10.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.11.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.11.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.12.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.12.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.13.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.13.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.14.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.14.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.15.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.15.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.16.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.16.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.17.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.17.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.17.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.17.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.18.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.18.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.19.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.19.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.20.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.20.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.21.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.21.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.21.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.21.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.22.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.22.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.23.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.23.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.24.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.24.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.24.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.24.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.25.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.25.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.26.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.26.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.27.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.27.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.28.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.28.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.28.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.28.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.29.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.29.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.30.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.30.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.31.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.31.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.31.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.31.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.32.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.32.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.33.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.33.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.34.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.34.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.35.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.35.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.35.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.35.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.36.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.36.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.37.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.37.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.38.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.38.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.38.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.38.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.39.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.39.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.40.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.40.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.41.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.41.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.42.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.42.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.42.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.42.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.43.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.43.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.44.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.44.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.45.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.45.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.45.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.45.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.46.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.46.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.47.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.47.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.48.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.48.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.49.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.49.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.49.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.49.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.50.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.50.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.51.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.51.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.52.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.52.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.52.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.52.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.53.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.53.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.54.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.54.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.55.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.55.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.56.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.56.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.56.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.56.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.57.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.57.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.58.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.58.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.59.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.59.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.59.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.59.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.60.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.60.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.61.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.61.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.62.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.62.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.63.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.63.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.63.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.63.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.64.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.64.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.65.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.65.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.66.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.66.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.66.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.66.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.67.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.67.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.68.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.68.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.69.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.69.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.70.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.70.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.70.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.70.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.71.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.71.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.72.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.72.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.73.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.73.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.73.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.73.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.74.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.74.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.75.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.75.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.76.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.76.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.77.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.77.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.77.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.77.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.78.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.78.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.79.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.79.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.80.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.80.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.80.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.80.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.81.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.81.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.82.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.82.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.83.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.83.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.84.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.84.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.84.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.84.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.85.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.85.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.86.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.86.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.87.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.87.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.87.down_proj.weight": "model-00057-of-000163.safetensors", - 
"model.layers.23.mlp.experts.87.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.88.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.88.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.89.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.89.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.90.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.90.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.91.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.gate_proj.weight_scale_inv": "model-00057-of-000163.safetensors", 
"model.layers.23.mlp.experts.91.up_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.up_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.91.down_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.91.down_proj.weight_scale_inv": "model-00057-of-000163.safetensors", "model.layers.23.mlp.experts.92.gate_proj.weight": "model-00057-of-000163.safetensors", - "model.layers.23.mlp.experts.92.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.92.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.92.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.92.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.92.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.93.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.93.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.94.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.94.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.94.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.94.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.95.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.95.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.96.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.96.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.97.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.97.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.98.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.98.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.98.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.98.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.99.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.99.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.100.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.100.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.101.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.101.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.101.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.101.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.102.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.102.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.103.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.103.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.104.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.104.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.105.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.105.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.105.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.105.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.106.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.106.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.107.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.107.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.108.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.108.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.108.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.108.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.109.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.109.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.110.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.110.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.111.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.111.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.112.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.112.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.112.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.112.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.113.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.113.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.114.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.114.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.115.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.115.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.115.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.115.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.116.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.116.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.117.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.117.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.118.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.118.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.119.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.119.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.119.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.119.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.120.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.120.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.121.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.121.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.122.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.122.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.122.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.122.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.123.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.123.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.124.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.124.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.125.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.125.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.126.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.126.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.126.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.126.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.127.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.127.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.128.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.128.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.129.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.129.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.129.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.129.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.130.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.130.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.131.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.131.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.132.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.132.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.133.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.133.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.133.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.133.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.134.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.134.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.135.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.135.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.136.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.136.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.136.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.136.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.137.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.137.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.138.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.138.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.139.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.139.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.140.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.140.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.140.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.140.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.141.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.141.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.142.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.142.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.143.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.143.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.143.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.143.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.144.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.144.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.145.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.145.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.146.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.146.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.147.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.147.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.147.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.147.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.148.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.148.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.149.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.149.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.150.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.150.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.150.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.150.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.151.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.151.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.152.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.152.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.153.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.153.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.154.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.154.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.154.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.154.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.155.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.155.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.156.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.156.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.157.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.157.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.157.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.157.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.158.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.158.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.159.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.159.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.160.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.160.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.161.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.161.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.161.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.161.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.162.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.162.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.163.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.163.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.164.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.164.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.164.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.164.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.165.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.165.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.166.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.166.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.167.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.167.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.168.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.168.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.168.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.168.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.169.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.169.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.170.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.170.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.171.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.171.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.171.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.171.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.172.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.172.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.173.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.173.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.174.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.174.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.175.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.175.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.175.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.175.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.176.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.176.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.177.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.177.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.178.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.178.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.178.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.178.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.179.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.179.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.180.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.180.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.181.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.181.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.182.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.182.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.182.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.182.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.183.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.183.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.184.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.184.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.185.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.185.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.185.down_proj.weight": "model-00058-of-000163.safetensors", - 
"model.layers.23.mlp.experts.185.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.186.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.186.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.187.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.187.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.188.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.188.down_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.189.gate_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.gate_proj.weight_scale_inv": "model-00058-of-000163.safetensors", 
"model.layers.23.mlp.experts.189.up_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.up_proj.weight_scale_inv": "model-00058-of-000163.safetensors", "model.layers.23.mlp.experts.189.down_proj.weight": "model-00058-of-000163.safetensors", - "model.layers.23.mlp.experts.189.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.190.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.190.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.191.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.191.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.192.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.192.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.192.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.192.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.193.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.193.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.194.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.194.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.195.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.195.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.196.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.196.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.196.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.196.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.197.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.197.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.198.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.198.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.199.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.199.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.199.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.199.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.200.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.200.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.201.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.201.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.202.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.202.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.203.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.203.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.203.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.203.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.204.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.204.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.205.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.205.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.206.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.206.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.206.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.206.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.207.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.207.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.208.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.208.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.209.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.209.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.210.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.210.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.210.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.210.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.211.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.211.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.212.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.212.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.213.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.213.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.213.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.213.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.214.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.214.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.215.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.215.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.216.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.216.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.217.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.217.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.217.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.217.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.218.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.218.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.219.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.219.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.220.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.220.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.220.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.220.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.221.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.221.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.222.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.222.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.223.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.223.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.224.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.224.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.224.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.224.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.225.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.225.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.226.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.226.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.227.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.227.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.227.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.227.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.228.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.228.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.229.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.229.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.230.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.230.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.231.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.231.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.231.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.231.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.232.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.232.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.233.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.233.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.234.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.234.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.234.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.234.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.235.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.235.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.236.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.236.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.237.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.237.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.238.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.238.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.238.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.238.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.239.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.239.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.240.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.240.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.241.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.241.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.241.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.241.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.242.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.242.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.243.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.243.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.244.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.244.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.245.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.245.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.245.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.245.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.246.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.246.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.247.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.247.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.248.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.248.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.248.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.248.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.249.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.249.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.250.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.250.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.251.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.251.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.252.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.23.mlp.experts.252.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.252.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.252.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.253.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.253.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.254.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.254.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.255.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.23.mlp.experts.255.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.mlp.experts.255.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.23.mlp.experts.255.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.23.input_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.23.post_attention_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_a_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.q_a_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_a_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.q_b_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.q_b_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_a_proj_with_mqa.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_a_layernorm.weight": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.kv_b_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.kv_b_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.self_attn.o_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.self_attn.o_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.gate.weight": "model-00059-of-000163.safetensors", "model.layers.24.mlp.gate.e_score_correction_bias": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.shared_experts.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.shared_experts.down_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.24.mlp.shared_experts.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.0.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.0.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.1.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.1.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.2.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.2.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.up_proj.weight": 
"model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.3.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.3.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.4.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.4.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.5.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.5.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.6.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.6.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.24.mlp.experts.7.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.7.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.7.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.7.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.8.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.8.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.9.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.9.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.10.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.10.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.11.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.11.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.12.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.12.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.13.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.13.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.gate_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.24.mlp.experts.14.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.14.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.14.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.14.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.15.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.15.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.16.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.16.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.17.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.17.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.24.mlp.experts.17.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.17.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.18.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.18.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.19.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.19.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.20.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.20.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.gate_proj.weight": "model-00059-of-000163.safetensors", - 
"model.layers.24.mlp.experts.21.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.21.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.21.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.21.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.22.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.22.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.23.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.23.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.24.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.24.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", 
"model.layers.24.mlp.experts.24.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.24.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.gate_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.up_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.up_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.25.down_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.25.down_proj.weight_scale_inv": "model-00059-of-000163.safetensors", "model.layers.24.mlp.experts.26.gate_proj.weight": "model-00059-of-000163.safetensors", - "model.layers.24.mlp.experts.26.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.26.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.26.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.26.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.26.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.27.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.27.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.28.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.28.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.28.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.28.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.29.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.29.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.30.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.30.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.31.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.31.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.31.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.31.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.32.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.32.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.33.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.33.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.34.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.34.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.35.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.35.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.35.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.35.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.36.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.36.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.37.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.37.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.38.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.38.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.38.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.38.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.39.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.39.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.40.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.40.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.41.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.41.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.42.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.42.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.42.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.42.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.43.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.43.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.44.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.44.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.45.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.45.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.45.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.45.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.46.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.46.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.47.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.47.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.48.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.48.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.49.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.49.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.49.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.49.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.50.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.50.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.51.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.51.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.52.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.52.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.52.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.52.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.53.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.53.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.54.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.54.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.55.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.55.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.56.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.56.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.56.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.56.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.57.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.57.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.58.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.58.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.59.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.59.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.59.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.59.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.60.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.60.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.61.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.61.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.62.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.62.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.63.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.63.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.63.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.63.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.64.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.64.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.65.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.65.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.66.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.66.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.66.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.66.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.67.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.67.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.68.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.68.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.69.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.69.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.70.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.70.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.70.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.70.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.71.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.71.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.72.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.72.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.73.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.73.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.73.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.73.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.74.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.74.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.75.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.75.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.76.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.76.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.77.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.77.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.77.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.77.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.78.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.78.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.79.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.79.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.80.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.80.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.80.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.80.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.81.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.81.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.82.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.82.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.83.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.83.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.84.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.84.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.84.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.84.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.85.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.85.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.86.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.86.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.87.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.87.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.87.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.87.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.88.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.88.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.89.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.89.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.90.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.90.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.91.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.91.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.91.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.91.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.92.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.92.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.93.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.93.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.94.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.94.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.94.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.94.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.95.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.95.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.96.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.96.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.97.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.97.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.98.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.98.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.98.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.98.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.99.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.99.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.100.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.100.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.101.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.101.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.101.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.101.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.102.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.102.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.103.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.103.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.104.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.104.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.105.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.105.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.105.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.105.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.106.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.106.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.107.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.107.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.108.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.108.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.108.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.108.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.109.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.109.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.110.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.110.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.111.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.111.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.112.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.112.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.112.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.112.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.113.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.113.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.114.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.114.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.115.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.115.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.115.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.115.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.116.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.116.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.117.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.117.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.118.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.118.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.gate_proj.weight": "model-00060-of-000163.safetensors", - 
"model.layers.24.mlp.experts.119.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.119.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.119.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.119.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.120.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.120.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.121.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.121.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.122.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.122.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", 
"model.layers.24.mlp.experts.122.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.122.down_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.gate_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.gate_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.up_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.up_proj.weight_scale_inv": "model-00060-of-000163.safetensors", "model.layers.24.mlp.experts.123.down_proj.weight": "model-00060-of-000163.safetensors", - "model.layers.24.mlp.experts.123.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.124.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.124.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.125.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.125.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.126.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.126.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.126.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.126.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.127.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.127.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.128.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.128.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.129.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.129.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.129.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.129.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.130.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.130.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.131.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.131.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.132.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.132.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.133.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.133.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.133.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.133.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.134.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.134.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.135.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.135.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.136.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.136.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.136.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.136.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.137.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.137.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.138.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.138.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.139.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.139.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.140.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.140.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.140.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.140.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.141.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.141.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.142.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.142.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.143.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.143.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.143.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.143.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.144.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.144.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.145.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.145.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.146.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.146.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.147.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.147.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.147.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.147.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.148.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.148.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.149.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.149.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.150.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.150.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.150.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.150.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.151.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.151.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.152.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.152.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.153.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.153.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.154.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.154.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.154.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.154.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.155.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.155.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.156.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.156.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.157.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.157.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.157.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.157.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.158.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.158.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.159.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.159.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.160.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.160.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.161.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.161.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.161.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.161.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.162.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.162.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.163.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.163.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.164.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.164.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.164.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.164.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.165.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.165.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.166.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.166.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.167.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.167.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.168.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.168.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.168.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.168.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.169.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.169.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.170.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.170.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.171.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.171.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.171.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.171.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.172.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.172.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.173.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.173.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.174.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.174.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.175.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.175.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.175.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.175.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.176.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.176.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.177.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.177.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.178.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.178.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.178.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.178.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.179.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.179.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.180.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.180.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.181.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.181.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.182.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.182.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.182.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.182.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.183.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.183.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.184.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.184.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.185.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.185.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.185.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.185.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.186.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.186.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.187.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.187.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.188.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.188.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.189.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.189.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.189.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.189.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.190.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.190.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.191.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.191.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.192.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.192.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.192.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.192.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.193.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.193.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.194.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.194.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.195.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.195.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.196.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.196.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.196.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.196.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.197.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.197.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.198.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.198.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.199.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.199.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.199.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.199.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.200.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.200.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.201.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.201.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.202.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.202.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.203.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.203.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.203.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.203.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.204.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.204.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.205.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.205.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.206.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.206.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.206.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.206.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.207.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.207.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.208.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.208.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.209.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.209.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.210.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.210.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.210.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.210.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.211.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.211.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.212.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.212.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.213.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.213.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.213.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.213.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.214.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.214.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.215.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.215.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.216.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.216.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.gate_proj.weight": "model-00061-of-000163.safetensors", - 
"model.layers.24.mlp.experts.217.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.217.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.217.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.217.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.218.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.218.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.219.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.219.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.220.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.220.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.up_proj.weight_scale_inv": "model-00061-of-000163.safetensors", 
"model.layers.24.mlp.experts.220.down_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.220.down_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.221.gate_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.221.gate_proj.weight_scale_inv": "model-00061-of-000163.safetensors", "model.layers.24.mlp.experts.221.up_proj.weight": "model-00061-of-000163.safetensors", - "model.layers.24.mlp.experts.221.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.221.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.221.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.222.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.222.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.223.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.223.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.24.mlp.experts.224.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.224.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.224.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.224.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.225.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.225.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.226.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.226.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.227.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.227.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.24.mlp.experts.227.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.227.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.228.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.228.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.229.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.229.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.230.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.230.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.24.mlp.experts.231.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.231.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.231.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.231.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.232.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.232.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.233.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.233.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.234.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.234.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.24.mlp.experts.234.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.234.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.235.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.235.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.236.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.236.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.237.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.237.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.24.mlp.experts.238.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.238.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.238.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.238.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.239.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.239.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.240.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.240.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.241.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.241.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.24.mlp.experts.241.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.241.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.242.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.242.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.243.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.243.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.244.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.244.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.24.mlp.experts.245.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.245.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.245.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.245.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.246.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.246.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.247.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.247.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.248.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.248.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.24.mlp.experts.248.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.248.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.249.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.249.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.250.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.250.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.251.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.251.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.24.mlp.experts.252.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.252.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.252.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.252.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.253.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.253.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.254.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.254.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.255.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.mlp.experts.255.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.24.mlp.experts.255.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.24.mlp.experts.255.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.24.input_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.24.post_attention_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_a_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.q_a_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_a_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.q_b_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.q_b_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_a_proj_with_mqa.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_a_layernorm.weight": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.kv_b_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.kv_b_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.self_attn.o_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.self_attn.o_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.gate.weight": "model-00062-of-000163.safetensors", "model.layers.25.mlp.gate.e_score_correction_bias": "model-00062-of-000163.safetensors", "model.layers.25.mlp.shared_experts.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.shared_experts.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.shared_experts.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.shared_experts.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.0.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.0.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.1.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.1.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.2.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.2.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.gate_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.3.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.3.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.3.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.3.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.4.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.4.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.5.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.5.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.6.down_proj.weight": 
"model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.6.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.7.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.7.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.8.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.8.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.9.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.9.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.10.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.10.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.10.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.10.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.11.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.11.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.12.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.12.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.13.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.13.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.13.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.13.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.14.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.14.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.15.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.15.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.16.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.16.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.17.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.17.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.17.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.17.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.18.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.18.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.19.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.19.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.20.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.20.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.20.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.20.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.21.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.21.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.22.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.22.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.23.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.23.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.24.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.24.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.24.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.24.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.25.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.25.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.26.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.26.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.27.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.27.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.27.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.27.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.28.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.28.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.29.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.29.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.30.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.30.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.31.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.31.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.31.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.31.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.32.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.32.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.33.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.33.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.34.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.34.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.34.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.34.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.35.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.35.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.36.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.36.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.37.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.37.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.38.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.38.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.38.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.38.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.39.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.39.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.40.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.40.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.41.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.41.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.41.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.41.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.42.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.42.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.43.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.43.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.44.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.44.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.45.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.45.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.45.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.45.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.46.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.46.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.47.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.47.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.48.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.48.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.48.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.48.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.49.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.49.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.50.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.50.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.51.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.51.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.52.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", 
"model.layers.25.mlp.experts.52.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.52.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.52.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.53.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.53.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.54.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.54.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.55.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.55.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.55.down_proj.weight": "model-00062-of-000163.safetensors", - 
"model.layers.25.mlp.experts.55.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.56.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.56.down_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.gate_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.gate_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.up_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.up_proj.weight_scale_inv": "model-00062-of-000163.safetensors", "model.layers.25.mlp.experts.57.down_proj.weight": "model-00062-of-000163.safetensors", - "model.layers.25.mlp.experts.57.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.58.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.58.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.59.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.59.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.59.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.59.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.60.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.60.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.61.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.61.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.62.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.62.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.62.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.62.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.63.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.63.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.64.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.64.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.65.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.65.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.66.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.66.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.66.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.66.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.67.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.67.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.68.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.68.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.69.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.69.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.69.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.69.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.70.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.70.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.71.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.71.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.72.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.72.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.73.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.73.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.73.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.73.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.74.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.74.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.75.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.75.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.76.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.76.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.76.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.76.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.77.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.77.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.78.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.78.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.79.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.79.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.80.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.80.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.80.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.80.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.81.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.81.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.82.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.82.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.83.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.83.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.83.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.83.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.84.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.84.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.85.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.85.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.86.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.86.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.87.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.87.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.87.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.87.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.88.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.88.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.89.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.89.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.90.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.90.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.90.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.90.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.91.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.91.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.92.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.92.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.93.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.93.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.94.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.94.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.94.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.94.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.95.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.95.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.96.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.96.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.97.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.97.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.97.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.97.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.98.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.98.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.99.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.99.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.100.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.100.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.101.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.101.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.101.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.101.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.102.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.102.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.103.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.103.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.104.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.104.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.104.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.104.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.105.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.105.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.106.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.106.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.107.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.107.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.108.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.108.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.108.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.108.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.109.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.109.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.110.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.110.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.111.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.111.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.111.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.111.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.112.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.112.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.113.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.113.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.114.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.114.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.115.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.115.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.115.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.115.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.116.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.116.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.117.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.117.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.118.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.118.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.118.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.118.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.119.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.119.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.120.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.120.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.121.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.121.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.122.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.122.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.122.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.122.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.123.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.123.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.124.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.124.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.125.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.125.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.125.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.125.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.126.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.126.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.127.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.127.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.128.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.128.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.129.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.129.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.129.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.129.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.130.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.130.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.131.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.131.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.132.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.132.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.132.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.132.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.133.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.133.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.134.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.134.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.135.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.135.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.136.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.136.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.136.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.136.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.137.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.137.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.138.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.138.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.139.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.139.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.139.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.139.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.140.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.140.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.141.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.141.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.142.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.142.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.143.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.143.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.143.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.143.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.144.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.144.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.145.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.145.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.146.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.146.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.146.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.146.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.147.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.147.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.148.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.148.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.149.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.149.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.150.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", 
"model.layers.25.mlp.experts.150.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.150.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.150.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.151.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.151.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.152.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.152.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.153.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.153.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.153.down_proj.weight": "model-00063-of-000163.safetensors", - 
"model.layers.25.mlp.experts.153.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.up_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.154.down_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.154.down_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.155.gate_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.155.gate_proj.weight_scale_inv": "model-00063-of-000163.safetensors", "model.layers.25.mlp.experts.155.up_proj.weight": "model-00063-of-000163.safetensors", - "model.layers.25.mlp.experts.155.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.155.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.155.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.156.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.156.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.157.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.157.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.157.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.157.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.158.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.158.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.159.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.159.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.160.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.160.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.160.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.160.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.161.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.161.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.162.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.162.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.163.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.163.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.164.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.164.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.164.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.164.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.165.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.165.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.166.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.166.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.167.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.167.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.167.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.167.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.168.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.168.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.169.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.169.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.170.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.170.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.171.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.171.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.171.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.171.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.172.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.172.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.173.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.173.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.174.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.174.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.174.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.174.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.175.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.175.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.176.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.176.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.177.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.177.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.178.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.178.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.178.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.178.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.179.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.179.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.180.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.180.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.181.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.181.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.181.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.181.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.182.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.182.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.183.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.183.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.184.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.184.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.185.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.185.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.185.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.185.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.186.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.186.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.187.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.187.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.188.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.188.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.188.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.188.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.189.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.189.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.190.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.190.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.191.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.191.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.192.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.192.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.192.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.192.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.193.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.193.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.194.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.194.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.195.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.195.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.195.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.195.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.196.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.196.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.197.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.197.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.198.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.198.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.199.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.199.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.199.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.199.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.200.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.200.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.201.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.201.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.202.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.202.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.202.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.202.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.203.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.203.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.204.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.204.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.205.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.205.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.206.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.206.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.206.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.206.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.207.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.207.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.208.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.208.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.209.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.209.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.209.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.209.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.210.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.210.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.211.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.211.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.212.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.212.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.213.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.213.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.213.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.213.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.214.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.214.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.215.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.215.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.216.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.216.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.216.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.216.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.217.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.217.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.218.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.218.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.219.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.219.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.220.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.220.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.220.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.220.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.221.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.221.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.222.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.222.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.223.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.223.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.223.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.223.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.224.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.224.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.225.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.225.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.226.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.226.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.227.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.227.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.227.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.227.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.228.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.228.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.229.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.229.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.230.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.230.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.230.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.230.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.231.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.231.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.232.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.232.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.233.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.233.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.234.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.234.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.234.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.234.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.235.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.235.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.236.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.236.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.237.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.237.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.237.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.237.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.238.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.238.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.239.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.239.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.240.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.240.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.241.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.241.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.241.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.241.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.242.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.242.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.243.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.243.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.244.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.244.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.244.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.244.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.245.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.245.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.246.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.246.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.247.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.247.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.248.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", 
"model.layers.25.mlp.experts.248.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.248.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.248.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.249.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.249.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.250.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.250.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.251.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.251.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.251.down_proj.weight": "model-00064-of-000163.safetensors", - 
"model.layers.25.mlp.experts.251.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.gate_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.up_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.up_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.252.down_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.252.down_proj.weight_scale_inv": "model-00064-of-000163.safetensors", "model.layers.25.mlp.experts.253.gate_proj.weight": "model-00064-of-000163.safetensors", - "model.layers.25.mlp.experts.253.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.253.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.253.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.253.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.253.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.254.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.254.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.255.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.25.mlp.experts.255.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.mlp.experts.255.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.25.mlp.experts.255.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.25.input_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.25.post_attention_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_a_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.q_a_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_a_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.q_b_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.q_b_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_a_proj_with_mqa.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_a_layernorm.weight": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.kv_b_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.kv_b_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.self_attn.o_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.self_attn.o_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.gate.weight": "model-00065-of-000163.safetensors", "model.layers.26.mlp.gate.e_score_correction_bias": "model-00065-of-000163.safetensors", "model.layers.26.mlp.shared_experts.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.shared_experts.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.shared_experts.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.shared_experts.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.0.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.0.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.1.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.1.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.2.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.2.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.2.down_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.2.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.3.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.3.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.4.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.4.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.5.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.5.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.up_proj.weight": 
"model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.6.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.6.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.7.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.7.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.8.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.8.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.9.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.9.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.10.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.10.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.10.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.10.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.11.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.11.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.12.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.12.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.13.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.13.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.13.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.13.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.14.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.14.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.15.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.15.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.16.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.16.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.17.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.17.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.17.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.17.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.18.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.18.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.19.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.19.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.20.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.20.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.20.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.20.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.21.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.21.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.22.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.22.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.23.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.23.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.24.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.24.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.24.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.24.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.25.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.25.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.26.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.26.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.27.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.27.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.27.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.27.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.28.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.28.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.29.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.29.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.30.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.30.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.31.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.31.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.31.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.31.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.32.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.32.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.33.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.33.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.34.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.34.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.34.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.34.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.35.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.35.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.36.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.36.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.37.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.37.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.38.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.38.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.38.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.38.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.39.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.39.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.40.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.40.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.41.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.41.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.41.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.41.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.42.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.42.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.43.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.43.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.44.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.44.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.45.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.45.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.45.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.45.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.46.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.46.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.47.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.47.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.48.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.48.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.48.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.48.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.49.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.49.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.50.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.50.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.51.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.51.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.52.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.52.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.52.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.52.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.53.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.53.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.54.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.54.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.55.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.55.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.55.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.55.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.56.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.56.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.57.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.57.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.58.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.58.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.59.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.59.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.59.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.59.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.60.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.60.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.61.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.61.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.62.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.62.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.62.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.62.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.63.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.63.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.64.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.64.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.65.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.65.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.66.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.66.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.66.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.66.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.67.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.67.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.68.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.68.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.69.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.69.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.69.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.69.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.70.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.70.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.71.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.71.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.72.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.72.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.73.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.73.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.73.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.73.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.74.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.74.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.75.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.75.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.76.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.76.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.76.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.76.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.77.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.77.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.78.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.78.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.79.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.79.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.80.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.80.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.80.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.80.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.81.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.81.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.82.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.82.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.83.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.up_proj.weight": "model-00065-of-000163.safetensors", - 
"model.layers.26.mlp.experts.83.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.83.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.83.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.84.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.84.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.85.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.85.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.86.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.86.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", 
"model.layers.26.mlp.experts.87.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.87.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.87.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.87.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.up_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.88.down_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.88.down_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.89.gate_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.89.gate_proj.weight_scale_inv": "model-00065-of-000163.safetensors", "model.layers.26.mlp.experts.89.up_proj.weight": "model-00065-of-000163.safetensors", - "model.layers.26.mlp.experts.89.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.89.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.89.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.90.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.90.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.90.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.90.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.91.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.91.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.92.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.92.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.93.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.93.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.94.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.94.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.94.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.94.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.95.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.95.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.96.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.96.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.97.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.97.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.97.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.97.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.98.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.98.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.99.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.99.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.100.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.100.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.101.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.101.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.101.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.101.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.102.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.102.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.103.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.103.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.104.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.104.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.104.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.104.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.105.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.105.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.106.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.106.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.107.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.107.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.108.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.108.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.108.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.108.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.109.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.109.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.110.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.110.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.111.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.111.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.111.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.111.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.112.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.112.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.113.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.113.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.114.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.114.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.115.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.115.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.115.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.115.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.116.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.116.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.117.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.117.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.118.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.118.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.118.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.118.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.119.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.119.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.120.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.120.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.121.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.121.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.122.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.122.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.122.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.122.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.123.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.123.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.124.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.124.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.125.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.125.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.125.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.125.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.126.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.126.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.127.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.127.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.128.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.128.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.129.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.129.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.129.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.129.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.130.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.130.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.131.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.131.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.132.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.132.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.132.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.132.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.133.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.133.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.134.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.134.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.135.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.135.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.136.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.136.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.136.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.136.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.137.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.137.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.138.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.138.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.139.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.139.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.139.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.139.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.140.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.140.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.141.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.141.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.142.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.142.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.143.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.143.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.143.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.143.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.144.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.144.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.145.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.145.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.146.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.146.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.146.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.146.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.147.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.147.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.148.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.148.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.149.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.149.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.150.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.150.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.150.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.150.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.151.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.151.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.152.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.152.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.153.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.153.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.153.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.153.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.154.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.154.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.155.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.155.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.156.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.156.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.157.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.157.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.157.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.157.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.158.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.158.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.159.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.159.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.160.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.160.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.160.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.160.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.161.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.161.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.162.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.162.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.163.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.163.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.164.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.164.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.164.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.164.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.165.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.165.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.166.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.166.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.167.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.167.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.167.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.167.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.168.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.168.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.169.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.169.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.170.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.170.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.171.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.171.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.171.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.171.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.172.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.172.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.173.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.173.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.174.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.174.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.174.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.174.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.175.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.175.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.176.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.176.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.177.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.177.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.178.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.178.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.178.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.178.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.179.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.179.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.180.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.180.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.181.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.up_proj.weight": "model-00066-of-000163.safetensors", - 
"model.layers.26.mlp.experts.181.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.181.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.181.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.182.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.182.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.183.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.183.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.184.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.184.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", 
"model.layers.26.mlp.experts.185.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.185.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.185.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.185.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.gate_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.up_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.up_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.186.down_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.186.down_proj.weight_scale_inv": "model-00066-of-000163.safetensors", "model.layers.26.mlp.experts.187.gate_proj.weight": "model-00066-of-000163.safetensors", - "model.layers.26.mlp.experts.187.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.187.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.187.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.187.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.187.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.188.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.188.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.188.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.188.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.189.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.189.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.190.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.190.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.191.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.191.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.192.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.192.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.192.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.192.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.193.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.193.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.194.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.194.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.195.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.195.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.195.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.195.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.196.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.196.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.197.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.197.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.198.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.198.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.199.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.199.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.199.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.199.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.200.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.200.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.201.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.201.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.202.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.202.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.202.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.202.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.203.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.203.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.204.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.204.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.205.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.205.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.206.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.206.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.206.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.206.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.207.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.207.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.208.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.208.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.209.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.209.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.209.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.209.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.210.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.210.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.211.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.211.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.212.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.212.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.213.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.213.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.213.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.213.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.214.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.214.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.215.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.215.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.216.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.216.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.216.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.216.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.217.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.217.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.218.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.218.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.219.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.219.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.220.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.220.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.220.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.220.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.221.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.221.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.222.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.222.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.223.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.223.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.223.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.223.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.224.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.224.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.225.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.225.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.226.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.226.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.227.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.227.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.227.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.227.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.228.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.228.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.229.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.229.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.230.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.230.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.230.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.230.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.231.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.231.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.232.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.232.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.233.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.233.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.234.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.234.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.234.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.234.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.235.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.235.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.236.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.236.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.237.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.237.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.237.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.237.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.238.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.238.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.239.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.239.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.240.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.240.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.241.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.241.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.241.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.241.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.242.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.242.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.243.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.243.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.244.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.244.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.244.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.244.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.245.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.245.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.246.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.246.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.247.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.247.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.248.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.248.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.248.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.248.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.249.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.249.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.250.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.250.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.251.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.26.mlp.experts.251.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.251.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.251.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.252.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.252.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.253.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.253.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.254.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.254.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.26.mlp.experts.255.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.255.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.mlp.experts.255.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.26.mlp.experts.255.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.26.input_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.26.post_attention_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_a_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.q_a_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_a_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.q_b_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.q_b_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_a_proj_with_mqa.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_a_layernorm.weight": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.kv_b_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.kv_b_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.self_attn.o_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.self_attn.o_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.gate.weight": "model-00067-of-000163.safetensors", "model.layers.27.mlp.gate.e_score_correction_bias": "model-00067-of-000163.safetensors", 
"model.layers.27.mlp.shared_experts.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.shared_experts.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.shared_experts.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.shared_experts.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.0.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.0.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.1.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.1.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.2.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.up_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.27.mlp.experts.2.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.2.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.2.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.3.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.3.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.4.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.4.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.5.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.5.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.gate_proj.weight": 
"model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.6.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.6.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.7.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.7.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.8.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.8.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.9.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.9.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.27.mlp.experts.9.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.9.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.10.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.10.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.11.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.11.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.12.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.12.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.gate_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.27.mlp.experts.13.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.13.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.13.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.13.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.14.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.14.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.15.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.15.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.16.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.16.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", 
"model.layers.27.mlp.experts.16.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.16.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.17.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.17.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.18.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.18.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.19.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.19.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.gate_proj.weight": "model-00067-of-000163.safetensors", - 
"model.layers.27.mlp.experts.20.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.20.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.20.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.20.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.21.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.21.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.up_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.22.down_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.22.down_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.23.gate_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.23.gate_proj.weight_scale_inv": "model-00067-of-000163.safetensors", "model.layers.27.mlp.experts.23.up_proj.weight": "model-00067-of-000163.safetensors", - "model.layers.27.mlp.experts.23.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.23.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.23.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.24.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.24.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.25.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.25.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.26.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.26.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.27.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.27.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.27.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.27.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.28.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.28.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.29.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.29.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.30.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.30.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.30.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.30.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.31.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.31.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.32.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.32.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.33.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.33.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.34.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.34.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.34.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.34.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.35.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.35.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.36.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.36.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.37.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.37.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.37.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.37.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.38.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.38.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.39.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.39.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.40.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.40.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.41.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.41.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.41.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.41.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.42.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.42.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.43.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.43.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.44.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.44.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.44.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.44.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.45.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.45.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.46.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.46.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.47.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.47.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.48.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.48.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.48.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.48.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.49.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.49.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.50.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.50.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.51.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.51.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.51.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.51.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.52.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.52.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.53.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.53.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.54.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.54.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.55.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.55.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.55.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.55.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.56.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.56.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.57.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.57.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.58.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.58.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.58.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.58.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.59.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.59.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.60.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.60.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.61.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.61.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.62.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.62.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.62.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.62.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.63.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.63.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.64.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.64.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.65.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.65.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.65.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.65.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.66.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.66.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.67.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.67.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.68.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.68.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.69.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.69.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.69.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.69.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.70.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.70.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.71.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.71.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.72.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.72.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.72.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.72.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.73.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.73.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.74.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.74.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.75.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.75.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.76.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.76.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.76.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.76.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.77.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.77.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.78.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.78.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.79.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.79.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.79.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.79.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.80.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.80.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.81.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.81.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.82.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.82.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.83.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.83.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.83.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.83.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.84.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.84.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.85.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.85.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.86.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.86.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.86.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.86.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.87.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.87.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.88.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.88.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.89.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.89.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.90.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.90.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.90.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.90.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.91.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.91.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.92.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.92.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.93.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.93.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.93.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.93.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.94.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.94.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.95.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.95.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.96.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.96.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.97.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.97.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.97.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.97.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.98.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.98.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.99.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.99.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.100.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.100.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.100.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.100.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.101.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.101.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.102.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.102.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.103.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.103.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.104.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.104.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.104.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.104.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.105.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.105.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.106.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.106.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.107.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.107.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.107.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.107.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.108.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.108.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.109.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.109.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.110.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.110.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.111.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.111.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.111.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.111.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.112.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.112.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.113.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.113.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.114.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.114.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", 
"model.layers.27.mlp.experts.114.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.114.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.115.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.115.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.116.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.116.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.117.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.117.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.gate_proj.weight": "model-00068-of-000163.safetensors", - 
"model.layers.27.mlp.experts.118.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.118.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.118.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.118.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.119.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.119.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.gate_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.up_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.up_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.120.down_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.120.down_proj.weight_scale_inv": "model-00068-of-000163.safetensors", "model.layers.27.mlp.experts.121.gate_proj.weight": "model-00068-of-000163.safetensors", - "model.layers.27.mlp.experts.121.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.121.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.121.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.121.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.121.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.122.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.122.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.123.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.123.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.124.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.124.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.125.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.125.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.125.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.125.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.126.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.126.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.127.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.127.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.128.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.128.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.128.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.128.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.129.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.129.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.130.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.130.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.131.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.131.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.132.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.132.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.132.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.132.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.133.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.133.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.134.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.134.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.135.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.135.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.135.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.135.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.136.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.136.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.137.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.137.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.138.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.138.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.139.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.139.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.139.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.139.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.140.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.140.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.141.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.141.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.142.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.142.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.142.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.142.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.143.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.143.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.144.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.144.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.145.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.145.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.146.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.146.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.146.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.146.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.147.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.147.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.148.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.148.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.149.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.149.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.149.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.149.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.150.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.150.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.151.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.151.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.152.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.152.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.153.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.153.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.153.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.153.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.154.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.154.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.155.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.155.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.156.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.156.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.156.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.156.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.157.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.157.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.158.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.158.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.159.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.159.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.160.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.160.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.160.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.160.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.161.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.161.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.162.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.162.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.163.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.163.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.163.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.163.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.164.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.164.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.165.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.165.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.166.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.166.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.167.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.167.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.167.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.167.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.168.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.168.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.169.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.169.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.170.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.170.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.170.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.170.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.171.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.171.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.172.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.172.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.173.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.173.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.174.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.174.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.174.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.174.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.175.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.175.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.176.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.176.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.177.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.177.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.177.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.177.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.178.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.178.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.179.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.179.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.180.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.180.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.181.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.181.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.181.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.181.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.182.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.182.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.183.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.183.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.184.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.184.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.184.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.184.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.185.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.185.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.186.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.186.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.187.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.187.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.188.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.188.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.188.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.188.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.189.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.189.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.190.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.190.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.191.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.191.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.191.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.191.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.192.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.192.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.193.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.193.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.194.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.194.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.195.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.195.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.195.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.195.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.196.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.196.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.197.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.197.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.198.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.198.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.198.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.198.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.199.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.199.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.200.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.200.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.201.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.201.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.202.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.202.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.202.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.202.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.203.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.203.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.204.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.204.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.205.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.205.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.205.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.205.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.206.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.206.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.207.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.207.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.208.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.208.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.209.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.209.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.209.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.209.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.210.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.210.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.211.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.211.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.212.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.212.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", 
"model.layers.27.mlp.experts.212.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.212.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.213.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.213.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.214.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.214.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.215.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.215.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.gate_proj.weight": "model-00069-of-000163.safetensors", - 
"model.layers.27.mlp.experts.216.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.216.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.216.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.216.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.217.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.217.down_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.gate_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.gate_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.up_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.up_proj.weight_scale_inv": "model-00069-of-000163.safetensors", "model.layers.27.mlp.experts.218.down_proj.weight": "model-00069-of-000163.safetensors", - "model.layers.27.mlp.experts.218.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.219.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.219.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.219.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.219.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.220.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.220.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.221.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.221.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.222.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.222.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.27.mlp.experts.223.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.223.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.223.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.223.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.224.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.224.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.225.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.225.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.226.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.226.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.226.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.226.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.227.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.227.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.228.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.228.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.229.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.229.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.27.mlp.experts.230.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.230.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.230.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.230.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.231.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.231.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.232.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.232.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.233.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.233.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.233.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.233.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.234.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.234.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.235.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.235.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.236.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.236.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.27.mlp.experts.237.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.237.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.237.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.237.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.238.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.238.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.239.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.239.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.240.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.240.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.240.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.240.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.241.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.241.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.242.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.242.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.243.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.243.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.27.mlp.experts.244.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.244.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.244.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.244.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.245.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.245.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.246.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.246.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.247.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.247.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.247.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.247.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.248.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.248.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.249.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.249.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.250.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.250.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.27.mlp.experts.251.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.251.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.251.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.251.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.252.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.252.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.253.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.253.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.254.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.254.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.27.mlp.experts.254.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.254.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.mlp.experts.255.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.27.mlp.experts.255.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.27.input_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.27.post_attention_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_a_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.q_a_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_a_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.q_b_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.q_b_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_a_proj_with_mqa.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_a_layernorm.weight": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.kv_b_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.kv_b_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.self_attn.o_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.self_attn.o_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.gate.weight": "model-00070-of-000163.safetensors", "model.layers.28.mlp.gate.e_score_correction_bias": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.shared_experts.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.shared_experts.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.0.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.0.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.1.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.1.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.gate_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.2.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.2.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.2.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.2.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.3.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.3.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.4.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.4.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.5.down_proj.weight": 
"model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.5.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.6.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.6.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.7.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.7.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.8.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.8.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.9.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.9.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.9.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.9.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.10.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.10.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.11.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.11.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.12.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.12.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.12.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.12.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.13.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.13.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.14.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.14.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.15.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.15.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.16.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.16.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.16.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.16.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.17.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.17.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.18.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.18.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.19.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.19.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.19.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.19.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.20.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.20.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.21.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.21.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.22.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.22.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.23.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.23.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.23.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.23.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.24.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.24.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.25.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.25.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.26.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.26.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.26.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.26.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.27.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.27.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.28.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.28.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.29.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.29.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.30.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.30.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.30.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.30.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.31.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.31.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.32.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.32.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.33.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.33.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.33.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.33.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.34.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.34.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.35.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.35.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.36.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.36.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.37.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.37.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.37.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.37.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.38.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.38.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.39.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.39.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.40.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.40.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.40.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.40.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.41.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.41.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.42.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.42.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.43.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.43.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.44.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.44.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.44.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.44.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.45.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.45.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.46.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.46.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.47.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.47.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.47.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.47.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.48.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.48.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.49.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.49.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.50.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.50.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.51.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", 
"model.layers.28.mlp.experts.51.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.51.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.51.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.52.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.52.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.53.down_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.53.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.54.gate_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.up_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.54.up_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.54.down_proj.weight": "model-00070-of-000163.safetensors", - 
"model.layers.28.mlp.experts.54.down_proj.weight_scale_inv": "model-00070-of-000163.safetensors", "model.layers.28.mlp.experts.55.gate_proj.weight": "model-00070-of-000163.safetensors", - "model.layers.28.mlp.experts.55.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.55.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.55.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.55.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.55.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.56.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.56.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.57.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.57.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.58.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.58.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.58.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.58.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.59.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.59.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.60.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.60.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.61.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.61.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.61.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.61.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.62.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.62.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.63.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.63.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.64.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.64.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.65.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.65.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.65.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.65.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.66.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.66.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.67.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.67.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.68.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.68.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.68.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.68.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.69.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.69.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.70.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.70.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.71.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.71.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.72.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.72.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.72.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.72.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.73.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.73.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.74.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.74.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.75.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.75.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.75.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.75.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.76.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.76.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.77.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.77.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.78.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.78.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.79.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.79.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.79.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.79.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.80.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.80.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.81.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.81.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.82.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.82.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.82.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.82.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.83.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.83.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.84.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.84.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.85.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.85.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.86.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.86.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.86.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.86.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.87.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.87.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.88.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.88.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.89.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.89.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.89.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.89.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.90.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.90.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.91.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.91.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.92.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.92.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.93.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.93.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.93.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.93.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.94.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.94.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.95.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.95.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.96.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.96.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.96.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.96.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.97.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.97.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.98.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.98.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.99.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.99.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.100.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.100.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.100.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.100.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.101.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.101.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.102.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.102.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.103.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.103.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.103.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.103.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.104.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.104.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.105.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.105.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.106.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.106.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.107.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.107.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.107.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.107.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.108.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.108.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.109.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.109.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.110.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.110.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.110.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.110.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.111.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.111.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.112.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.112.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.113.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.113.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.114.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.114.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.114.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.114.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.115.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.115.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.116.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.116.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.117.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.117.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.117.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.117.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.118.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.118.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.119.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.119.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.120.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.120.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.121.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.121.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.121.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.121.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.122.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.122.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.123.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.123.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.124.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.124.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.124.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.124.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.125.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.125.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.126.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.126.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.127.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.127.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.128.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.128.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.128.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.128.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.129.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.129.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.130.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.130.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.131.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.131.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.131.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.131.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.132.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.132.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.133.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.133.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.134.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.134.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.135.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.135.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.135.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.135.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.136.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.136.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.137.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.137.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.138.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.138.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.138.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.138.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.139.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.139.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.140.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.140.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.141.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.141.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.142.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.142.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.142.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.142.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.143.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.143.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.144.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.144.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.145.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.145.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.145.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.145.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.146.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.146.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.147.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.147.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.148.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.148.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.149.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", 
"model.layers.28.mlp.experts.149.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.149.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.149.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.150.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.150.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.151.down_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.151.down_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.gate_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.152.gate_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.up_proj.weight": "model-00071-of-000163.safetensors", - "model.layers.28.mlp.experts.152.up_proj.weight_scale_inv": "model-00071-of-000163.safetensors", "model.layers.28.mlp.experts.152.down_proj.weight": "model-00071-of-000163.safetensors", - 
"model.layers.28.mlp.experts.152.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.153.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.153.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.154.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.154.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.155.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.155.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.156.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.156.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.156.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.156.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.157.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.157.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.158.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.158.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.159.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.159.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.159.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.159.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.160.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.160.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.161.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.161.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.162.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.162.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.163.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.163.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.163.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.163.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.164.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.164.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.165.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.165.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.166.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.166.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.166.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.166.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.167.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.167.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.168.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.168.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.169.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.169.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.170.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.170.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.170.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.170.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.171.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.171.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.172.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.172.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.173.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.173.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.173.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.173.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.174.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.174.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.175.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.175.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.176.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.176.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.177.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.177.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.177.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.177.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.178.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.178.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.179.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.179.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.180.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.180.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.180.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.180.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.181.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.181.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.182.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.182.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.183.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.183.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.184.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.184.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.184.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.184.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.185.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.185.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.186.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.186.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.187.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.187.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.187.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.187.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.188.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.188.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.189.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.189.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.190.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.190.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.191.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.191.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.191.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.191.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.192.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.192.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.193.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.193.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.194.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.194.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.194.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.194.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.195.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.195.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.196.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.196.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.197.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.197.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.198.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.198.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.198.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.198.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.199.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.199.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.200.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.200.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.201.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.201.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.201.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.201.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.202.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.202.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.203.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.203.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.204.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.204.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.205.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.205.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.205.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.205.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.206.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.206.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.207.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.207.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.208.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.208.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.208.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.208.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.209.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.209.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.210.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.210.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.211.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.211.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.212.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.212.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.212.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.212.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.213.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.213.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.214.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.214.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.215.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.215.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.215.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.215.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.216.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.216.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.217.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.217.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.218.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.218.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.219.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.219.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.219.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.219.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.220.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.220.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.221.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.221.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.222.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.222.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.222.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.222.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.223.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.223.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.224.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.224.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.225.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.225.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.226.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.226.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.226.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.226.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.227.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.227.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.228.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.228.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.229.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.229.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.229.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.229.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.230.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.230.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.231.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.231.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.232.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.232.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.233.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.233.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.233.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.233.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.234.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.234.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.235.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.235.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.236.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.236.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.236.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.236.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.237.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.237.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.238.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.238.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.239.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.239.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.240.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.240.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.240.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.240.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.241.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.241.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.242.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.242.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.243.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.243.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.243.down_proj.weight": "model-00072-of-000163.safetensors", - 
"model.layers.28.mlp.experts.243.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.244.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.244.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.245.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.245.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.246.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.246.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.247.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", 
"model.layers.28.mlp.experts.247.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.247.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.247.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.248.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.248.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.up_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.249.down_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.249.down_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.250.gate_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.250.gate_proj.weight_scale_inv": "model-00072-of-000163.safetensors", "model.layers.28.mlp.experts.250.up_proj.weight": "model-00072-of-000163.safetensors", - "model.layers.28.mlp.experts.250.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.250.down_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.28.mlp.experts.250.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.251.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.251.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.252.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.252.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.253.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.253.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.254.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.28.mlp.experts.254.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.254.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.254.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.mlp.experts.255.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.28.mlp.experts.255.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.28.input_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.28.post_attention_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_a_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.q_a_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_a_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.q_b_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.q_b_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_a_proj_with_mqa.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_a_layernorm.weight": "model-00073-of-000163.safetensors", "model.layers.29.self_attn.kv_b_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.kv_b_proj.weight_scale_inv": 
"model-00073-of-000163.safetensors", "model.layers.29.self_attn.o_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.self_attn.o_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.gate.weight": "model-00073-of-000163.safetensors", "model.layers.29.mlp.gate.e_score_correction_bias": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.shared_experts.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.shared_experts.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.0.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.0.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.1.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.1.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.1.down_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.1.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.2.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.2.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.3.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.3.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.4.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.4.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.up_proj.weight": 
"model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.5.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.5.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.6.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.6.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.7.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.7.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.8.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.8.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.9.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.9.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.9.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.9.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.10.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.10.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.11.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.11.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.12.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.12.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.12.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.12.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.13.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.13.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.14.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.14.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.15.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.15.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.16.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.16.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.16.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.16.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.17.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.17.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.18.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.18.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.19.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.19.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.19.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.19.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.20.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.20.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.21.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.21.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.22.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.22.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.23.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.23.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.23.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.23.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.24.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.24.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.25.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.25.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.26.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.26.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.26.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.26.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.27.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.27.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.28.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.28.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.29.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.29.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.30.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.30.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.30.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.30.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.31.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.31.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.32.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.32.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.33.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.33.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.33.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.33.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.34.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.34.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.35.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.35.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.36.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.36.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.37.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.37.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.37.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.37.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.38.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.38.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.39.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.39.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.40.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.40.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.40.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.40.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.41.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.41.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.42.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.42.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.43.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.43.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.44.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.44.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.44.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.44.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.45.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.45.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.46.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.46.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.47.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.47.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.47.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.47.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.48.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.48.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.49.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.49.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.50.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.50.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.51.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.51.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.51.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.51.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.52.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.52.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.53.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.53.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.54.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.54.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.54.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.54.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.55.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.55.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.56.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.56.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.57.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.57.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.58.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.58.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.58.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.58.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.59.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.59.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.60.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.60.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.61.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.61.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.61.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.61.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.62.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.62.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.63.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.63.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.64.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.64.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.65.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.65.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.65.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.65.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.66.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.66.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.67.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.67.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.68.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.68.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.68.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.68.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.69.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.69.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.70.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.70.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.71.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.71.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.72.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.72.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.72.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.72.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.73.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.73.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.74.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.74.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.75.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.75.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.75.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.75.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.76.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.76.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.77.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.77.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.78.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.78.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.79.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.79.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.79.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.79.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.80.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.80.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.81.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.81.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.82.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.up_proj.weight": "model-00073-of-000163.safetensors", - 
"model.layers.29.mlp.experts.82.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.82.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.82.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.83.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.83.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.84.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.84.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.85.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.85.down_proj.weight_scale_inv": "model-00073-of-000163.safetensors", 
"model.layers.29.mlp.experts.86.gate_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.gate_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.86.up_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.up_proj.weight_scale_inv": "model-00073-of-000163.safetensors", "model.layers.29.mlp.experts.86.down_proj.weight": "model-00073-of-000163.safetensors", - "model.layers.29.mlp.experts.86.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.87.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.87.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.88.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.88.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.89.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.89.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.89.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.89.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.90.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.90.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.91.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.91.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.92.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.92.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.93.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.93.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.93.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.93.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.94.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.94.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.95.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.95.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.96.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.96.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.96.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.96.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.97.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.97.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.98.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.98.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.99.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.99.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.100.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.100.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.100.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.100.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.101.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.101.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.102.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.102.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.103.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.103.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.103.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.103.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.104.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.104.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.105.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.105.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.106.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.106.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.107.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.107.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.107.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.107.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.108.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.108.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.109.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.109.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.110.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.110.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.110.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.110.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.111.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.111.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.112.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.112.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.113.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.113.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.114.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.114.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.114.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.114.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.115.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.115.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.116.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.116.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.117.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.117.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.117.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.117.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.118.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.118.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.119.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.119.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.120.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.120.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.121.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.121.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.121.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.121.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.122.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.122.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.123.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.123.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.124.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.124.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.124.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.124.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.125.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.125.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.126.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.126.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.127.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.127.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.128.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.128.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.128.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.128.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.129.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.129.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.130.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.130.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.131.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.131.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.131.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.131.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.132.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.132.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.133.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.133.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.134.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.134.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.135.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.135.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.135.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.135.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.136.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.136.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.137.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.137.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.138.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.138.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.138.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.138.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.139.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.139.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.140.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.140.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.141.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.141.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.142.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.142.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.142.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.142.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.143.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.143.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.144.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.144.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.145.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.145.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.145.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.145.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.146.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.146.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.147.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.147.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.148.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.148.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.149.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.149.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.149.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.149.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.150.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.150.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.151.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.151.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.152.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.152.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.152.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.152.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.153.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.153.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.154.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.154.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.155.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.155.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.156.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.156.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.156.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.156.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.157.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.157.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.158.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.158.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.159.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.159.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.159.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.159.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.160.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.160.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.161.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.161.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.162.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.162.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.163.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.163.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.163.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.163.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.164.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.164.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.165.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.165.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.166.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.166.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.166.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.166.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.167.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.167.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.168.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.168.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.169.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.169.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.170.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.170.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.170.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.170.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.171.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.171.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.172.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.172.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.173.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.173.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.173.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.173.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.174.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.174.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.175.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.175.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.176.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.176.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.177.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.177.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.177.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.177.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.178.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.178.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.179.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.179.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.180.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.up_proj.weight": "model-00074-of-000163.safetensors", - 
"model.layers.29.mlp.experts.180.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.180.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.180.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.181.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.181.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.182.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.182.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.up_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.183.down_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.183.down_proj.weight_scale_inv": "model-00074-of-000163.safetensors", 
"model.layers.29.mlp.experts.184.gate_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.184.gate_proj.weight_scale_inv": "model-00074-of-000163.safetensors", "model.layers.29.mlp.experts.184.up_proj.weight": "model-00074-of-000163.safetensors", - "model.layers.29.mlp.experts.184.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.184.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.184.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.185.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.185.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.186.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.186.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.187.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.187.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.187.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.187.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.188.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.188.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.189.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.189.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.190.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.190.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.191.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.191.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.191.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.191.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.192.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.192.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.193.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.193.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.194.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.194.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.194.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.194.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.195.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.195.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.196.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.196.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.197.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.197.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.198.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.198.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.198.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.198.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.199.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.199.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.200.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.200.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.201.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.201.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.201.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.201.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.202.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.202.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.203.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.203.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.204.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.204.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.205.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.205.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.205.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.205.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.206.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.206.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.207.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.207.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.208.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.208.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.208.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.208.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.209.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.209.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.210.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.210.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.211.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.211.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.212.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.212.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.212.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.212.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.213.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.213.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.214.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.214.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.215.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.215.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.215.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.215.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.216.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.216.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.217.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.217.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.218.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.218.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.219.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.219.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.219.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.219.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.220.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.220.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.221.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.221.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.222.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.222.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.222.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.222.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.223.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.223.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.224.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.224.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.225.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.225.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.226.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.226.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.226.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.226.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.227.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.227.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.228.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.228.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.229.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.229.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.229.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.229.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.230.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.230.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.231.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.231.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.232.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.232.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.233.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.233.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.233.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.233.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.234.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.234.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.235.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.235.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.236.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.236.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.236.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.236.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.237.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.237.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.238.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.238.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.239.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.239.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.240.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.240.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.240.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.240.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.241.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.241.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.242.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.242.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.243.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.243.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.243.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.243.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.244.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.244.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.245.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.245.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.246.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.246.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.247.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.247.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.247.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.247.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.248.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.248.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.249.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.249.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.250.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.29.mlp.experts.250.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.250.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.250.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.251.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.251.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.252.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.252.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.253.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.253.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.29.mlp.experts.254.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.254.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.254.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.254.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.mlp.experts.255.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.29.mlp.experts.255.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.29.input_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.29.post_attention_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_a_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.q_a_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_a_layernorm.weight": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.q_b_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.q_b_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_a_proj_with_mqa.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_a_layernorm.weight": 
"model-00075-of-000163.safetensors", "model.layers.30.self_attn.kv_b_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.kv_b_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.self_attn.o_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.self_attn.o_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.gate.weight": "model-00075-of-000163.safetensors", "model.layers.30.mlp.gate.e_score_correction_bias": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.shared_experts.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.shared_experts.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.0.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.0.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.1.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.up_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.30.mlp.experts.1.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.1.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.1.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.2.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.2.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.3.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.3.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.4.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.4.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.gate_proj.weight": 
"model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.5.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.5.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.6.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.6.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.7.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.7.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.8.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.8.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.30.mlp.experts.8.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.8.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.9.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.9.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.10.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.10.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.11.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.11.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.gate_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.30.mlp.experts.12.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.12.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.12.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.12.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.13.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.13.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.14.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.14.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.15.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.15.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", 
"model.layers.30.mlp.experts.15.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.15.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.16.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.16.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.17.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.17.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.18.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.18.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.gate_proj.weight": "model-00075-of-000163.safetensors", - 
"model.layers.30.mlp.experts.19.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.19.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.19.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.19.down_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.gate_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.gate_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.up_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.up_proj.weight_scale_inv": "model-00075-of-000163.safetensors", "model.layers.30.mlp.experts.20.down_proj.weight": "model-00075-of-000163.safetensors", - "model.layers.30.mlp.experts.20.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.21.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.21.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.22.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.22.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.22.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.22.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.23.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.23.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.24.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.24.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.25.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.25.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.26.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.26.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.26.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.26.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.27.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.27.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.28.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.28.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.29.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.29.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.29.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.29.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.30.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.30.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.31.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.31.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.32.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.32.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.33.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.33.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.33.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.33.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.34.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.34.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.35.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.35.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.36.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.36.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.36.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.36.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.37.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.37.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.38.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.38.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.39.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.39.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.40.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.40.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.40.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.40.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.41.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.41.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.42.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.42.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.43.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.43.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.43.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.43.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.44.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.44.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.45.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.45.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.46.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.46.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.47.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.47.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.47.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.47.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.48.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.48.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.49.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.49.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.50.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.50.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.50.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.50.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.51.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.51.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.52.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.52.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.53.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.53.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.54.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.54.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.54.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.54.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.55.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.55.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.56.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.56.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.57.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.57.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.57.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.57.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.58.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.58.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.59.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.59.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.60.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.60.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.61.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.61.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.61.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.61.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.62.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.62.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.63.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.63.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.64.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.64.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.64.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.64.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.65.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.65.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.66.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.66.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.67.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.67.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.68.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.68.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.68.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.68.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.69.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.69.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.70.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.70.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.71.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.71.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.71.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.71.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.72.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.72.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.73.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.73.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.74.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.74.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.75.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.75.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.75.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.75.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.76.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.76.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.77.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.77.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.78.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.78.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.78.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.78.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.79.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.79.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.80.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.80.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.81.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.81.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.82.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.82.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.82.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.82.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.83.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.83.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.84.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.84.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.85.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.85.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.85.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.85.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.86.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.86.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.87.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.87.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.88.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.88.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.89.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.89.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.89.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.89.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.90.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.90.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.91.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.91.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.92.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.92.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.92.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.92.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.93.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.93.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.94.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.94.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.95.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.95.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.96.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.96.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.96.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.96.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.97.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.97.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.98.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.98.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.99.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.99.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.99.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.99.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.100.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.100.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.101.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.101.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.102.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.102.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.103.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.103.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.103.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.103.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.104.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.104.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.105.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.105.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.106.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.106.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.106.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.106.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.107.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.107.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.108.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.108.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.109.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.109.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.110.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.110.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.110.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.110.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.111.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.111.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.112.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.112.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.113.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.113.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", 
"model.layers.30.mlp.experts.113.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.113.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.114.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.114.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.115.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.115.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.116.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.116.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.gate_proj.weight": "model-00076-of-000163.safetensors", - 
"model.layers.30.mlp.experts.117.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.117.up_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.117.down_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.117.down_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.118.gate_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.118.gate_proj.weight_scale_inv": "model-00076-of-000163.safetensors", "model.layers.30.mlp.experts.118.up_proj.weight": "model-00076-of-000163.safetensors", - "model.layers.30.mlp.experts.118.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.118.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.118.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.119.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.119.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.120.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.120.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.120.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.120.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.121.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.121.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.122.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.122.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.123.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.123.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.124.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.124.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.124.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.124.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.125.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.125.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.126.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.126.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.127.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.127.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.127.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.127.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.128.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.128.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.129.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.129.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.130.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.130.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.131.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.131.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.131.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.131.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.132.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.132.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.133.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.133.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.134.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.134.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.134.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.134.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.135.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.135.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.136.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.136.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.137.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.137.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.138.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.138.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.138.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.138.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.139.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.139.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.140.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.140.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.141.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.141.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.141.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.141.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.142.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.142.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.143.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.143.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.144.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.144.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.145.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.145.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.145.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.145.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.146.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.146.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.147.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.147.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.148.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.148.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.148.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.148.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.149.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.149.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.150.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.150.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.151.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.151.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.152.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.152.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.152.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.152.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.153.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.153.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.154.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.154.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.155.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.155.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.155.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.155.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.156.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.156.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.157.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.157.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.158.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.158.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.159.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.159.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.159.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.159.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.160.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.160.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.161.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.161.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.162.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.162.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.162.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.162.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.163.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.163.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.164.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.164.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.165.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.165.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.166.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.166.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.166.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.166.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.167.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.167.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.168.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.168.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.169.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.169.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.169.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.169.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.170.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.170.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.171.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.171.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.172.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.172.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.173.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.173.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.173.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.173.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.174.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.174.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.175.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.175.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.176.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.176.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.176.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.176.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.177.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.177.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.178.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.178.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.179.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.179.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.180.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.180.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.180.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.180.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.181.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.181.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.182.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.182.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.183.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.183.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.183.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.183.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.184.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.184.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.185.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.185.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.186.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.186.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.187.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.187.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.187.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.187.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.188.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.188.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.189.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.189.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.190.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.190.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.190.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.190.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.191.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.191.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.192.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.192.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.193.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.193.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.194.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.194.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.194.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.194.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.195.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.195.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.196.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.196.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.197.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.197.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.197.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.197.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.198.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.198.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.199.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.199.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.200.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.200.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.201.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.201.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.201.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.201.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.202.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.202.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.203.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.203.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.204.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.204.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.204.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.204.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.205.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.205.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.206.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.206.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.207.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.207.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.208.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.208.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.208.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.208.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.209.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.209.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.210.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.210.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.211.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.211.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", 
"model.layers.30.mlp.experts.211.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.211.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.212.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.212.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.213.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.213.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.214.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.214.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.gate_proj.weight": "model-00077-of-000163.safetensors", - 
"model.layers.30.mlp.experts.215.gate_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.up_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.215.up_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.215.down_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.215.down_proj.weight_scale_inv": "model-00077-of-000163.safetensors", "model.layers.30.mlp.experts.216.gate_proj.weight": "model-00077-of-000163.safetensors", - "model.layers.30.mlp.experts.216.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.216.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.216.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.216.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.216.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.217.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.217.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.218.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.218.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.218.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.218.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.219.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.219.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.220.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.220.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.221.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.221.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.gate_proj.weight": "model-00078-of-000163.safetensors", - 
"model.layers.30.mlp.experts.222.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.222.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.222.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.222.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.223.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.223.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.224.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.224.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.225.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.225.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.225.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.225.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.226.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.226.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.227.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.227.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.228.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.228.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.gate_proj.weight": "model-00078-of-000163.safetensors", - 
"model.layers.30.mlp.experts.229.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.229.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.229.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.229.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.230.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.230.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.231.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.231.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.232.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.232.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.232.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.232.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.233.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.233.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.234.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.234.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.235.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.235.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.gate_proj.weight": "model-00078-of-000163.safetensors", - 
"model.layers.30.mlp.experts.236.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.236.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.236.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.236.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.237.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.237.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.238.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.238.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.239.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.239.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.239.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.239.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.240.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.240.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.241.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.241.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.242.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.242.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.gate_proj.weight": "model-00078-of-000163.safetensors", - 
"model.layers.30.mlp.experts.243.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.243.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.243.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.243.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.244.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.244.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.245.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.245.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.246.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.246.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.246.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.246.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.247.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.247.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.248.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.248.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.249.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.249.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.gate_proj.weight": "model-00078-of-000163.safetensors", - 
"model.layers.30.mlp.experts.250.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.250.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.250.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.250.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.251.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.251.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.252.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.252.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.253.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.253.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", 
"model.layers.30.mlp.experts.253.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.253.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.254.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.254.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.gate_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.gate_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.up_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.up_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.mlp.experts.255.down_proj.weight": "model-00078-of-000163.safetensors", - "model.layers.30.mlp.experts.255.down_proj.weight_scale_inv": "model-00078-of-000163.safetensors", "model.layers.30.input_layernorm.weight": "model-00078-of-000163.safetensors", "model.layers.30.post_attention_layernorm.weight": "model-00078-of-000163.safetensors", "model.layers.31.self_attn.q_a_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.q_a_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.q_a_layernorm.weight": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.q_b_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.q_b_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_a_proj_with_mqa.weight": 
"model-00079-of-000163.safetensors", - "model.layers.31.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_a_layernorm.weight": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.kv_b_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.kv_b_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.self_attn.o_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.self_attn.o_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.gate.weight": "model-00079-of-000163.safetensors", "model.layers.31.mlp.gate.e_score_correction_bias": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.shared_experts.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.shared_experts.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.0.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.0.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.gate_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.1.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.1.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.1.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.1.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.2.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.2.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.3.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.3.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.4.down_proj.weight": 
"model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.4.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.5.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.5.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.6.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.6.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.7.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.7.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.8.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.8.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.8.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.8.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.9.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.9.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.10.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.10.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.11.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.11.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.11.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.11.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.12.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.12.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.13.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.13.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.14.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.14.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.15.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.15.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.15.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.15.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.16.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.16.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.17.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.17.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.18.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.18.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.18.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.18.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.19.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.19.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.20.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.20.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.21.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.21.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.22.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.22.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.22.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.22.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.23.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.23.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.24.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.24.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.25.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.25.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.25.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.25.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.26.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.26.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.27.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.27.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.28.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.28.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.29.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.29.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.29.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.29.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.30.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.30.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.31.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.31.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.32.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.32.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.32.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.32.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.33.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.33.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.34.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.34.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.35.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.35.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.36.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.36.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.36.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.36.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.37.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.37.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.38.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.38.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.39.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.39.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.39.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.39.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.40.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.40.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.41.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.41.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.42.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.42.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.43.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.43.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.43.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.43.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.44.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.44.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.45.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.45.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.46.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.46.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.46.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.46.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.47.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.47.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.48.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.48.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.49.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.49.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.50.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.50.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.50.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.50.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.51.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.51.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.52.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.52.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.53.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.53.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.53.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.53.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.54.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.54.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.55.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.55.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.56.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.56.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.57.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.57.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.57.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.57.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.58.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.58.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.59.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.59.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.60.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.60.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.60.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.60.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.61.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.61.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.62.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.62.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.63.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.63.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.64.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.64.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.64.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.64.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.65.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.65.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.66.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.66.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.67.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.67.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.67.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.67.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.68.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.68.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.69.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.69.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.70.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.70.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.71.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.71.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.71.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.71.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.72.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.72.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.73.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.73.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.74.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.74.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.74.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.74.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.75.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.75.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.76.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.76.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.77.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.77.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.78.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.78.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.78.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.78.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.79.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.79.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.80.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.80.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.81.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.81.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.81.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.81.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.82.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.82.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.83.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.83.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.84.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.84.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.85.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", 
"model.layers.31.mlp.experts.85.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.85.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.85.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.86.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.86.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.87.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.87.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.88.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.88.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.88.down_proj.weight": "model-00079-of-000163.safetensors", - 
"model.layers.31.mlp.experts.88.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.89.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.89.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.90.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.90.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.gate_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.up_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.up_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.91.down_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.91.down_proj.weight_scale_inv": "model-00079-of-000163.safetensors", "model.layers.31.mlp.experts.92.gate_proj.weight": "model-00079-of-000163.safetensors", - "model.layers.31.mlp.experts.92.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.92.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.92.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.92.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.92.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.93.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.93.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.94.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.94.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.95.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.95.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.95.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.95.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.96.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.96.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.97.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.97.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.98.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.98.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.99.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.99.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.99.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.99.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.100.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.100.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.101.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.101.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.102.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.102.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.102.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.102.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.103.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.103.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.104.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.104.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.105.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.105.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.106.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.106.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.106.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.106.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.107.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.107.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.108.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.108.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.109.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.109.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.109.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.109.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.110.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.110.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.111.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.111.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.112.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.112.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.113.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.113.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.113.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.113.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.114.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.114.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.115.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.115.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.116.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.116.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.116.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.116.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.117.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.117.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.118.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.118.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.119.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.119.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.120.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.120.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.120.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.120.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.121.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.121.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.122.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.122.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.123.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.123.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.123.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.123.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.124.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.124.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.125.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.125.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.126.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.126.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.127.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.127.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.127.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.127.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.128.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.128.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.129.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.129.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.130.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.130.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.130.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.130.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.131.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.131.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.132.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.132.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.133.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.133.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.134.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.134.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.134.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.134.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.135.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.135.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.136.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.136.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.137.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.137.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.137.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.137.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.138.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.138.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.139.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.139.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.140.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.140.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.141.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.141.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.141.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.141.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.142.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.142.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.143.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.143.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.144.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.144.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.144.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.144.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.145.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.145.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.146.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.146.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.147.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.147.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.148.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.148.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.148.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.148.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.149.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.149.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.150.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.150.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.151.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.151.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.151.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.151.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.152.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.152.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.153.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.153.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.154.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.154.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.155.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.155.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.155.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.155.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.156.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.156.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.157.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.157.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.158.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.158.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.158.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.158.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.159.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.159.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.160.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.160.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.161.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.161.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.162.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.162.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.162.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.162.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.163.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.163.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.164.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.164.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.165.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.165.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.165.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.165.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.166.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.166.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.167.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.167.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.168.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.168.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.169.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.169.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.169.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.169.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.170.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.170.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.171.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.171.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.172.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.172.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.172.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.172.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.173.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.173.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.174.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.174.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.175.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.175.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.176.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.176.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.176.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.176.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.177.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.177.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.178.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.178.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.179.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.179.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.179.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.179.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.180.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.180.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.181.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.181.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.182.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.182.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.183.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", 
"model.layers.31.mlp.experts.183.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.183.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.183.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.184.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.184.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.185.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.185.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.186.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.186.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.186.down_proj.weight": "model-00080-of-000163.safetensors", - 
"model.layers.31.mlp.experts.186.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.187.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.187.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.188.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.188.down_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.gate_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.gate_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.up_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.up_proj.weight_scale_inv": "model-00080-of-000163.safetensors", "model.layers.31.mlp.experts.189.down_proj.weight": "model-00080-of-000163.safetensors", - "model.layers.31.mlp.experts.189.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.190.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.190.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.190.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.190.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.191.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.191.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.192.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.192.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.193.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.193.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.193.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.193.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.194.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.194.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.195.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.195.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.196.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.196.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.197.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.197.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.197.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.197.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.198.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.198.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.199.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.199.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.200.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.200.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.200.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.200.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.201.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.201.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.202.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.202.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.203.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.203.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.204.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.204.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.204.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.204.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.205.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.205.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.206.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.206.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.207.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.207.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.207.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.207.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.208.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.208.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.209.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.209.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.210.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.210.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.211.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.211.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.211.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.211.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.212.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.212.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.213.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.213.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.214.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.214.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.214.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.214.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.215.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.215.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.216.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.216.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.217.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.217.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.218.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.218.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.218.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.218.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.219.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.219.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.220.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.220.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.221.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.221.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.221.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.221.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.222.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.222.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.223.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.223.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.224.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.224.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.225.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.225.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.225.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.225.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.226.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.226.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.227.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.227.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.228.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.228.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.228.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.228.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.229.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.229.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.230.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.230.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.231.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.231.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.232.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.232.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.232.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.232.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.233.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.233.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.234.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.234.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.235.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.235.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.235.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.235.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.236.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.236.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.237.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.237.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.238.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.238.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.239.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.239.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.239.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.239.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.240.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.240.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.241.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.241.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.242.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.242.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.242.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.242.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.243.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.243.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.244.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.244.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.245.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.245.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.246.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.246.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.246.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.246.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.247.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.247.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.248.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.248.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.249.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.249.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.249.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.31.mlp.experts.249.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.250.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.250.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.251.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.251.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.252.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.252.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.253.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.31.mlp.experts.253.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.253.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.253.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.254.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.254.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.mlp.experts.255.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.31.mlp.experts.255.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.31.input_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.31.post_attention_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_a_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.q_a_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_a_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.q_b_proj.weight": 
"model-00081-of-000163.safetensors", - "model.layers.32.self_attn.q_b_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_a_proj_with_mqa.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_a_layernorm.weight": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.kv_b_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.kv_b_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.self_attn.o_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.self_attn.o_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.gate.weight": "model-00081-of-000163.safetensors", "model.layers.32.mlp.gate.e_score_correction_bias": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.shared_experts.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.shared_experts.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.0.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.0.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.0.down_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.32.mlp.experts.0.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.1.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.1.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.2.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.2.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.3.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.3.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.up_proj.weight": 
"model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.4.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.4.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.5.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.5.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.6.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.6.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.7.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.7.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.32.mlp.experts.8.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.8.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.8.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.8.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.9.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.9.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.10.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.10.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.11.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.up_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.32.mlp.experts.11.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.11.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.11.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.12.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.12.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.13.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.13.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.14.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.14.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.32.mlp.experts.15.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.15.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.15.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.15.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.16.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.16.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.17.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.17.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.18.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.up_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.32.mlp.experts.18.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.18.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.18.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.19.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.19.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.20.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.20.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.21.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.21.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", 
"model.layers.32.mlp.experts.22.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.22.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.22.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.22.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.23.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.23.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.up_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.24.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.24.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.25.gate_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.up_proj.weight": "model-00081-of-000163.safetensors", - 
"model.layers.32.mlp.experts.25.up_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.25.down_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.25.down_proj.weight_scale_inv": "model-00081-of-000163.safetensors", "model.layers.32.mlp.experts.26.gate_proj.weight": "model-00081-of-000163.safetensors", - "model.layers.32.mlp.experts.26.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.26.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.26.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.26.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.26.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.27.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.27.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.28.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.28.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.29.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.29.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.29.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.29.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.30.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.30.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.31.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.31.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.32.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.32.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.32.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.32.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.33.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.33.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.34.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.34.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.35.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.35.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.36.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.36.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.36.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.36.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.37.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.37.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.38.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.38.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.39.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.39.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.39.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.39.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.40.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.40.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.41.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.41.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.42.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.42.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.43.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.43.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.43.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.43.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.44.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.44.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.45.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.45.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.46.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.46.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.46.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.46.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.47.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.47.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.48.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.48.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.49.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.49.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.50.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.50.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.50.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.50.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.51.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.51.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.52.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.52.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.53.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.53.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.53.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.53.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.54.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.54.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.55.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.55.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.56.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.56.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.57.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.57.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.57.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.57.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.58.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.58.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.59.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.59.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.60.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.60.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.60.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.60.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.61.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.61.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.62.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.62.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.63.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.63.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.64.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.64.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.64.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.64.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.65.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.65.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.66.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.66.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.67.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.67.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.67.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.67.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.68.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.68.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.69.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.69.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.70.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.70.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.71.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.71.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.71.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.71.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.72.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.72.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.73.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.73.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.74.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.74.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.74.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.74.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.75.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.75.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.76.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.76.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.77.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.77.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.78.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.78.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.78.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.78.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.79.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.79.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.80.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.80.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.81.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.81.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.81.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.81.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.82.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.82.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.83.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.83.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.84.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.84.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.85.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.85.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.85.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.85.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.86.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.86.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.87.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.87.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.88.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.88.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.88.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.88.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.89.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.89.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.90.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.90.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.91.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.91.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.92.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.92.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.92.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.92.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.93.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.93.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.94.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.94.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.95.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.95.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.95.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.95.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.96.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.96.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.97.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.97.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.98.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.98.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.99.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.99.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.99.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.99.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.100.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.100.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.101.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.101.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.102.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.102.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.102.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.102.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.103.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.103.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.104.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.104.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.105.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.105.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.106.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.106.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.106.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.106.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.107.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.107.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.108.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.108.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.109.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.109.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.109.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.109.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.110.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.110.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.111.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.111.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.112.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.112.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.113.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.113.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.113.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.113.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.114.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.114.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.115.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.115.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.116.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.116.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.116.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.116.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.117.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.117.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.118.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.118.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.119.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.119.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", 
"model.layers.32.mlp.experts.120.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.120.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.120.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.120.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.121.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.121.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.up_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.122.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.122.down_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.gate_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.123.gate_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.up_proj.weight": "model-00082-of-000163.safetensors", - 
"model.layers.32.mlp.experts.123.up_proj.weight_scale_inv": "model-00082-of-000163.safetensors", "model.layers.32.mlp.experts.123.down_proj.weight": "model-00082-of-000163.safetensors", - "model.layers.32.mlp.experts.123.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.124.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.124.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.125.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.125.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.126.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.126.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.127.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.127.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.127.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.127.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.128.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.128.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.129.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.129.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.130.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.130.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.130.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.130.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.131.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.131.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.132.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.132.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.133.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.133.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.134.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.134.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.134.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.134.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.135.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.135.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.136.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.136.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.137.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.137.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.137.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.137.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.138.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.138.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.139.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.139.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.140.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.140.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.141.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.141.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.141.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.141.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.142.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.142.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.143.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.143.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.144.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.144.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.144.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.144.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.145.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.145.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.146.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.146.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.147.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.147.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.148.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.148.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.148.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.148.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.149.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.149.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.150.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.150.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.151.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.151.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.151.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.151.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.152.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.152.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.153.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.153.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.154.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.154.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.155.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.155.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.155.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.155.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.156.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.156.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.157.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.157.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.158.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.158.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.158.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.158.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.159.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.159.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.160.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.160.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.161.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.161.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.162.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.162.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.162.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.162.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.163.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.163.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.164.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.164.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.165.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.165.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.165.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.165.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.166.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.166.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.167.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.167.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.168.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.168.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.169.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.169.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.169.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.169.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.170.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.170.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.171.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.171.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.172.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.172.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.172.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.172.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.173.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.173.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.174.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.174.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.175.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.175.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.176.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.176.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.176.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.176.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.177.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.177.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.178.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.178.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.179.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.179.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.179.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.179.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.180.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.180.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.181.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.181.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.182.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.182.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.183.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.183.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.183.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.183.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.184.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.184.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.185.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.185.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.186.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.186.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.186.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.186.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.187.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.187.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.188.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.188.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.189.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.189.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.190.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.190.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.190.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.190.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.191.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.191.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.192.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.192.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.193.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.193.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.193.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.193.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.194.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.194.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.195.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.195.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.196.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.196.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.197.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.197.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.197.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.197.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.198.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.198.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.199.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.199.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.200.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.200.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.200.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.200.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.201.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.201.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.202.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.202.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.203.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.203.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.204.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.204.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.204.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.204.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.205.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.205.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.206.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.206.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.207.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.207.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.207.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.207.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.208.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.208.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.209.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.209.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.210.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.210.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.211.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.211.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.211.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.211.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.212.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.212.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.213.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.213.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.214.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.214.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.214.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.214.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.215.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.215.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.216.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.216.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.217.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.217.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", 
"model.layers.32.mlp.experts.218.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.218.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.218.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.218.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.219.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.219.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.up_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.up_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.220.down_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.220.down_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.221.gate_proj.weight": "model-00083-of-000163.safetensors", - "model.layers.32.mlp.experts.221.gate_proj.weight_scale_inv": "model-00083-of-000163.safetensors", "model.layers.32.mlp.experts.221.up_proj.weight": "model-00083-of-000163.safetensors", - 
"model.layers.32.mlp.experts.221.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.221.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.221.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.222.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.222.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.223.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.223.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.224.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.224.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.32.mlp.experts.225.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.225.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.225.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.225.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.226.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.226.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.227.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.227.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.228.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.up_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.32.mlp.experts.228.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.228.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.228.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.229.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.229.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.230.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.230.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.231.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.231.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.32.mlp.experts.232.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.232.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.232.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.232.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.233.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.233.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.234.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.234.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.235.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.up_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.32.mlp.experts.235.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.235.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.235.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.236.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.236.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.237.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.237.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.238.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.238.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.32.mlp.experts.239.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.239.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.239.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.239.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.240.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.240.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.241.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.241.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.242.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.up_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.32.mlp.experts.242.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.242.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.242.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.243.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.243.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.244.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.244.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.245.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.245.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.32.mlp.experts.246.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.246.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.246.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.246.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.247.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.247.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.248.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.248.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.249.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.up_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.32.mlp.experts.249.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.249.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.249.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.250.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.250.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.251.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.251.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.252.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.252.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.32.mlp.experts.253.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.253.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.253.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.253.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.254.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.254.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.mlp.experts.255.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.32.mlp.experts.255.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.32.input_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.32.post_attention_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_a_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.self_attn.q_a_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_a_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.q_b_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.q_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_a_proj_with_mqa.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_a_layernorm.weight": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.kv_b_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.kv_b_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.self_attn.o_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.self_attn.o_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.gate.weight": "model-00084-of-000163.safetensors", "model.layers.33.mlp.gate.e_score_correction_bias": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.shared_experts.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.shared_experts.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.up_proj.weight": 
"model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.0.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.0.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.1.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.1.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.2.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.2.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.3.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.3.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.4.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.4.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.4.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.4.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.5.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.5.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.6.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.6.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.up_proj.weight_scale_inv": 
"model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.7.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.7.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.8.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.8.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.9.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.9.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.10.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.10.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.11.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.11.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.11.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.11.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.12.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.12.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.13.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.13.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.14.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.14.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.14.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.14.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.15.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.15.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.16.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.16.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.17.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.17.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.18.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.18.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.18.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.18.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.19.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.19.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.20.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.20.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.21.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.21.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.21.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.21.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.22.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.22.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.23.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.23.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.24.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.24.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.25.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.25.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.25.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.25.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.26.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.26.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.27.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.27.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.28.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.28.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.28.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.28.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.29.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.29.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.30.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.30.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.31.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.31.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.32.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.32.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.32.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.32.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.33.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.33.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.34.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.34.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.35.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.35.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.35.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.35.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.36.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.36.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.37.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.37.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.38.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.38.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.39.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.39.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.39.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.39.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.40.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.40.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.41.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.41.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.42.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.42.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.42.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.42.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.43.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.43.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.44.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.44.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.45.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.45.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.46.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.46.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.46.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.46.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.47.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.47.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.48.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.48.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.49.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.49.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.49.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.49.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.50.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.50.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.51.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.51.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.52.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.52.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.gate_proj.weight": "model-00084-of-000163.safetensors", - 
"model.layers.33.mlp.experts.53.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.53.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.53.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.53.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.54.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.54.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.55.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.55.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.56.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.56.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", 
"model.layers.33.mlp.experts.56.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.56.down_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.gate_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.gate_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.up_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.up_proj.weight_scale_inv": "model-00084-of-000163.safetensors", "model.layers.33.mlp.experts.57.down_proj.weight": "model-00084-of-000163.safetensors", - "model.layers.33.mlp.experts.57.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.58.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.58.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.59.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.59.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.60.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.60.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.60.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.60.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.61.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.61.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.62.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.62.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.63.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.63.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.63.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.63.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.64.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.64.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.65.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.65.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.66.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.66.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.67.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.67.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.67.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.67.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.68.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.68.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.69.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.69.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.70.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.70.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.70.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.70.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.71.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.71.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.72.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.72.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.73.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.73.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.74.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.74.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.74.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.74.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.75.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.75.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.76.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.76.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.77.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.77.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.77.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.77.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.78.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.78.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.79.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.79.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.80.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.80.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.81.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.81.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.81.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.81.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.82.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.82.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.83.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.83.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.84.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.84.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.84.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.84.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.85.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.85.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.86.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.86.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.87.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.87.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.88.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.88.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.88.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.88.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.89.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.89.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.90.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.90.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.91.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.91.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.91.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.91.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.92.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.92.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.93.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.93.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.94.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.94.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.95.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.95.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.95.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.95.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.96.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.96.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.97.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.97.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.98.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.98.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.98.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.98.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.99.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.99.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.100.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.100.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.101.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.101.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.102.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.102.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.102.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.102.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.103.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.103.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.104.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.104.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.105.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.105.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.105.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.105.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.106.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.106.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.107.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.107.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.108.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.108.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.109.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.109.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.109.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.109.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.110.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.110.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.111.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.111.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.112.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.112.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.112.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.112.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.113.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.113.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.114.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.114.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.115.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.115.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.116.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.116.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.116.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.116.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.117.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.117.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.118.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.118.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.119.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.119.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.119.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.119.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.120.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.120.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.121.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.121.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.122.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.122.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.123.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.123.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.123.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.123.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.124.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.124.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.125.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.125.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.126.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.126.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.126.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.126.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.127.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.127.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.128.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.128.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.129.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.129.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.130.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.130.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.130.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.130.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.131.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.131.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.132.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.132.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.133.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.133.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.133.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.133.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.134.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.134.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.135.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.135.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.136.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.136.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.137.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.137.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.137.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.137.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.138.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.138.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.139.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.139.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.140.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.140.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.140.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.140.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.141.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.141.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.142.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.142.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.143.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.143.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.144.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.144.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.144.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.144.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.145.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.145.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.146.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.146.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.147.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.147.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.147.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.147.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.148.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.148.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.149.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.149.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.150.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.150.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.gate_proj.weight": "model-00085-of-000163.safetensors", - 
"model.layers.33.mlp.experts.151.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.151.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.151.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.151.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.152.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.152.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.153.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.153.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.154.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.154.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.up_proj.weight_scale_inv": "model-00085-of-000163.safetensors", 
"model.layers.33.mlp.experts.154.down_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.154.down_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.155.gate_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.155.gate_proj.weight_scale_inv": "model-00085-of-000163.safetensors", "model.layers.33.mlp.experts.155.up_proj.weight": "model-00085-of-000163.safetensors", - "model.layers.33.mlp.experts.155.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.155.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.155.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.156.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.156.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.157.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.157.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.158.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.158.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.158.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.158.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.159.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.159.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.160.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.160.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.161.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.161.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.161.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.161.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.162.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.162.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.163.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.163.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.164.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.164.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.165.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.165.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.165.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.165.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.166.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.166.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.167.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.167.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.168.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.168.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.168.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.168.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.169.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.169.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.170.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.170.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.171.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.171.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.172.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.172.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.172.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.172.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.173.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.173.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.174.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.174.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.175.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.175.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.175.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.175.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.176.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.176.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.177.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.177.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.178.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.178.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.179.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.179.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.179.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.179.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.180.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.180.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.181.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.181.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.182.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.182.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.182.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.182.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.183.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.183.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.184.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.184.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.185.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.185.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.186.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.186.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.186.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.186.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.187.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.187.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.188.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.188.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.189.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.189.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.189.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.189.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.190.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.190.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.191.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.191.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.192.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.192.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.193.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.193.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.193.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.193.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.194.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.194.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.195.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.195.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.196.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.196.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.196.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.196.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.197.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.197.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.198.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.198.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.199.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.199.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.200.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.200.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.200.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.200.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.201.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.201.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.202.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.202.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.203.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.203.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.203.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.203.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.204.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.204.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.205.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.205.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.206.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.206.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.207.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.207.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.207.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.207.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.208.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.208.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.209.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.209.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.210.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.210.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.210.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.210.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.211.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.211.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.212.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.212.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.213.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.213.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.214.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.214.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.214.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.214.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.215.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.215.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.216.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.216.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.217.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.217.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.217.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.217.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.218.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.218.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.219.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.219.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.220.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.220.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.221.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.221.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.221.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.221.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.222.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.222.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.223.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.223.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.224.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.224.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.224.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.224.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.225.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.225.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.226.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.226.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.227.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.227.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.228.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.228.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.228.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.228.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.229.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.229.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.230.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.230.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.231.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.231.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.231.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.231.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.232.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.232.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.233.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.233.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.234.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.234.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.235.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.235.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.235.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.235.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.236.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.236.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.237.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.237.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.238.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.238.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.238.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.238.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.239.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.239.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.240.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.240.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.241.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.241.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.242.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.242.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.242.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.242.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.243.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.243.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.244.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.244.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.245.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.245.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.245.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.245.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.246.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.246.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.247.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.247.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.248.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.248.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.gate_proj.weight": "model-00086-of-000163.safetensors", - 
"model.layers.33.mlp.experts.249.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.249.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.249.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.249.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.250.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.250.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.251.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.251.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.252.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.gate_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.252.up_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.up_proj.weight_scale_inv": "model-00086-of-000163.safetensors", 
"model.layers.33.mlp.experts.252.down_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.252.down_proj.weight_scale_inv": "model-00086-of-000163.safetensors", "model.layers.33.mlp.experts.253.gate_proj.weight": "model-00086-of-000163.safetensors", - "model.layers.33.mlp.experts.253.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.253.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.253.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.253.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.253.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.254.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.254.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.mlp.experts.255.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.33.mlp.experts.255.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.33.input_layernorm.weight": "model-00087-of-000163.safetensors", 
"model.layers.33.post_attention_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_a_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.q_a_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_a_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.q_b_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.q_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_a_proj_with_mqa.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_a_layernorm.weight": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.kv_b_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.kv_b_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.self_attn.o_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.self_attn.o_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.gate.weight": "model-00087-of-000163.safetensors", "model.layers.34.mlp.gate.e_score_correction_bias": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.shared_experts.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.shared_experts.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.gate_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.0.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.0.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.0.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.0.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.1.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.1.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.2.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.2.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.3.down_proj.weight": 
"model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.3.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.4.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.4.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.5.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.5.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.6.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.6.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.7.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.7.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.7.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.7.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.8.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.8.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.9.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.9.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.10.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.11.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.11.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.12.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.12.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.13.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.13.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.14.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.14.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.14.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.14.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.15.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.15.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.16.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.16.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.17.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.17.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.18.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.18.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.18.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.18.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.19.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.19.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.20.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.20.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.21.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.21.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.21.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.21.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.22.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.22.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.23.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.23.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.24.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.24.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.25.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.25.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.25.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.25.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.26.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.26.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.27.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.27.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.28.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.28.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.28.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.28.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.29.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.29.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.30.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.30.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.31.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.31.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.32.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.32.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.32.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.32.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.33.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.33.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.34.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.34.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.35.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.35.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.35.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.35.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.36.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.36.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.37.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.37.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.38.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.38.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.39.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.39.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.39.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.39.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.40.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.40.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.41.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.41.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.42.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.42.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.42.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.42.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.43.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.43.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.44.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.44.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.45.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.45.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.46.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.46.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.46.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.46.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.47.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.47.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.48.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.48.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.49.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.49.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.49.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.49.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.50.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.50.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.51.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.51.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.52.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.52.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.53.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.53.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.53.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.53.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.54.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.54.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.55.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.55.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.56.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.56.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.56.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.56.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.57.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.57.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.58.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.58.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.59.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.59.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.60.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.60.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.60.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.60.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.61.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.61.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.62.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.62.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.63.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.63.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.63.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.63.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.64.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.64.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.65.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.65.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.66.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.66.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.67.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.67.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.67.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.67.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.68.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.68.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.69.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.69.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.70.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.70.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.70.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.70.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.71.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.71.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.72.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.72.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.73.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.73.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.74.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.74.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.74.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.74.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.75.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.75.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.76.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.76.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.77.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.77.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.77.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.77.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.78.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.78.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.79.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.79.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.80.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.80.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.81.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.81.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.81.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.81.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.82.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.82.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.83.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.83.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.84.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.up_proj.weight": "model-00087-of-000163.safetensors", - 
"model.layers.34.mlp.experts.84.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.84.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.84.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.85.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.85.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.86.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.86.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.87.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.87.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", 
"model.layers.34.mlp.experts.88.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.88.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.up_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.88.down_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.88.down_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.89.gate_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.89.gate_proj.weight_scale_inv": "model-00087-of-000163.safetensors", "model.layers.34.mlp.experts.89.up_proj.weight": "model-00087-of-000163.safetensors", - "model.layers.34.mlp.experts.89.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.89.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.89.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.90.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.90.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.91.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.91.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.91.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.91.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.92.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.92.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.93.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.93.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.94.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.94.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.95.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.95.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.95.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.95.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.96.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.96.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.97.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.97.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.98.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.98.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.98.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.98.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.99.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.99.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.100.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.100.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.101.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.101.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.102.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.102.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.102.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.102.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.103.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.103.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.104.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.104.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.105.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.105.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.105.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.105.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.106.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.106.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.107.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.107.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.108.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.108.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.109.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.109.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.109.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.109.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.110.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.110.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.111.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.111.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.112.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.112.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.112.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.112.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.113.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.113.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.114.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.114.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.115.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.115.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.116.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.116.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.116.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.116.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.117.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.117.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.118.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.118.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.119.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.119.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.119.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.119.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.120.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.120.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.121.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.121.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.122.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.122.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.123.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.123.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.123.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.123.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.124.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.124.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.125.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.125.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.126.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.126.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.126.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.126.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.127.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.127.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.128.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.128.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.129.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.129.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.130.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.130.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.130.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.130.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.131.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.131.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.132.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.132.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.133.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.133.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.133.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.133.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.134.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.134.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.135.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.135.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.136.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.136.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.137.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.137.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.137.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.137.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.138.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.138.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.139.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.139.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.140.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.140.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.140.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.140.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.141.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.141.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.142.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.142.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.143.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.143.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.144.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.144.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.144.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.144.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.145.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.145.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.146.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.146.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.147.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.147.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.147.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.147.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.148.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.148.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.149.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.149.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.150.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.150.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.151.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.151.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.151.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.151.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.152.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.152.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.153.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.153.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.154.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.154.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.154.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.154.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.155.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.155.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.156.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.156.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.157.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.157.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.158.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.158.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.158.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.158.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.159.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.159.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.160.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.160.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.161.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.161.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.161.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.161.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.162.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.162.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.163.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.163.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.164.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.164.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.165.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.165.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.165.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.165.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.166.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.166.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.167.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.167.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.168.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.168.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.168.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.168.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.169.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.169.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.170.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.170.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.171.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.171.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.172.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.172.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.172.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.172.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.173.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.173.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.174.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.174.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.175.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.175.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.175.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.175.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.176.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.176.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.177.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.177.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.178.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.178.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.179.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.179.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.179.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.179.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.180.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.180.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.181.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.181.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.182.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.up_proj.weight": "model-00088-of-000163.safetensors", - 
"model.layers.34.mlp.experts.182.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.182.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.182.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.183.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.183.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.184.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.184.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.185.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.185.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", 
"model.layers.34.mlp.experts.186.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.gate_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.186.up_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.up_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.186.down_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.186.down_proj.weight_scale_inv": "model-00088-of-000163.safetensors", "model.layers.34.mlp.experts.187.gate_proj.weight": "model-00088-of-000163.safetensors", - "model.layers.34.mlp.experts.187.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.187.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.187.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.187.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.187.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.188.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.188.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.189.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.189.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.189.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.189.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.190.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.190.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.191.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.191.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.192.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.192.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.193.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.193.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.193.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.193.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.194.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.194.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.195.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.195.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.196.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.196.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.196.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.196.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.197.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.197.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.198.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.198.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.199.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.199.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.200.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.200.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.200.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.200.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.201.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.201.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.202.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.202.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.203.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.203.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.203.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.203.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.204.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.204.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.205.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.205.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.206.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.206.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.207.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.207.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.207.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.207.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.208.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.208.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.209.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.209.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.210.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.210.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.210.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.210.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.211.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.211.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.212.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.212.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.213.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.213.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.214.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.214.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.214.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.214.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.215.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.215.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.216.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.216.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.217.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.217.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.217.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.217.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.218.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.218.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.219.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.219.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.220.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.220.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.221.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.221.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.221.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.221.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.222.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.222.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.223.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.223.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.224.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.224.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.224.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.224.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.225.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.225.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.226.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.226.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.227.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.227.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.228.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.228.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.228.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.228.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.229.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.229.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.230.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.230.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.231.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.231.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.231.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.231.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.232.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.232.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.233.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.233.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.234.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.234.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.235.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.235.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.235.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.235.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.236.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.236.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.237.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.237.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.238.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.238.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.238.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.238.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.239.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.239.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.240.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.240.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.241.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.241.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.242.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.242.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.242.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.242.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.243.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.243.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.244.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.244.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.245.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.245.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.245.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.245.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.246.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.246.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.247.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.247.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.248.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.248.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.mlp.experts.249.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.249.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.249.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.249.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.250.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.250.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.251.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.251.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.252.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.up_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.34.mlp.experts.252.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.252.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.252.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.253.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.253.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.254.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.254.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.34.mlp.experts.255.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.34.mlp.experts.255.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.34.input_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.34.post_attention_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_a_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.q_a_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_a_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.q_b_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.q_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_a_proj_with_mqa.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_a_layernorm.weight": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.kv_b_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.kv_b_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.self_attn.o_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.self_attn.o_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.gate.weight": "model-00089-of-000163.safetensors", "model.layers.35.mlp.gate.e_score_correction_bias": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.shared_experts.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.shared_experts.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.35.mlp.experts.0.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.0.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.0.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.0.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.1.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.1.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.2.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.2.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.3.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.3.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.4.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.4.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.5.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.5.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.6.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.6.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.gate_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.35.mlp.experts.7.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.7.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.7.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.7.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.8.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.8.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.9.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.9.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.10.down_proj.weight": 
"model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.10.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.11.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.11.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.12.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.12.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.13.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.13.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.14.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.14.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.15.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.15.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.16.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.16.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.17.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.17.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.17.down_proj.weight": "model-00089-of-000163.safetensors", - 
"model.layers.35.mlp.experts.17.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.18.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.18.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.19.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.19.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.20.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.20.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.21.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", 
"model.layers.35.mlp.experts.21.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.21.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.21.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.up_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.22.down_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.22.down_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.23.gate_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.23.gate_proj.weight_scale_inv": "model-00089-of-000163.safetensors", "model.layers.35.mlp.experts.23.up_proj.weight": "model-00089-of-000163.safetensors", - "model.layers.35.mlp.experts.23.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.23.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.23.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.24.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.24.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.24.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.24.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.25.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.25.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.26.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.26.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.27.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.27.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.28.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.28.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.28.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.28.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.29.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.29.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.30.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.30.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.31.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.31.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.31.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.31.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.32.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.32.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.33.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.33.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.34.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.34.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.35.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.35.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.35.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.35.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.36.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.36.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.37.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.37.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.38.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.38.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.38.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.38.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.39.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.39.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.40.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.40.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.41.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.41.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.42.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.42.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.42.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.42.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.43.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.43.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.44.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.44.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.45.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.45.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.45.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.45.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.46.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.46.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.47.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.47.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.48.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.48.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.49.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.49.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.49.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.49.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.50.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.50.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.51.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.51.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.52.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.52.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.52.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.52.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.53.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.53.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.54.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.54.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.55.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.55.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.56.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.56.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.56.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.56.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.57.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.57.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.58.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.58.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.59.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.59.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.59.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.59.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.60.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.60.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.61.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.61.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.62.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.62.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.63.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.63.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.63.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.63.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.64.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.64.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.65.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.65.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.66.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.66.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.66.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.66.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.67.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.67.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.68.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.68.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.69.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.69.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.70.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.70.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.70.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.70.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.71.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.71.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.72.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.72.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.73.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.73.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.73.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.73.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.74.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.74.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.75.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.75.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.76.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.76.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.77.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.77.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.77.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.77.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.78.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.78.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.79.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.79.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.80.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.80.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.80.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.80.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.81.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.81.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.82.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.82.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.83.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.83.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.84.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.84.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.84.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.84.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.85.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.85.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.86.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.86.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.87.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.87.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.87.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.87.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.88.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.88.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.89.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.89.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.90.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.90.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.91.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.91.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.91.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.91.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.92.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.92.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.93.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.93.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.94.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.94.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.94.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.94.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.95.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.95.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.96.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.96.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.97.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.97.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.98.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.98.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.98.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.98.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.99.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.99.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.100.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.100.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.101.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.101.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.101.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.101.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.102.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.102.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.103.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.103.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.104.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.104.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.105.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.105.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.105.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.105.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.106.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.106.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.107.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.107.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.108.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.108.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.108.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.108.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.109.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.109.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.110.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.110.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.111.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.111.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.112.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.112.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.112.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.112.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.113.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.113.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.114.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.114.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.115.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.115.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.115.down_proj.weight": "model-00090-of-000163.safetensors", - 
"model.layers.35.mlp.experts.115.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.116.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.116.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.117.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.117.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.118.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.118.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.119.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", 
"model.layers.35.mlp.experts.119.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.119.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.119.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.gate_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.up_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.up_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.120.down_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.120.down_proj.weight_scale_inv": "model-00090-of-000163.safetensors", "model.layers.35.mlp.experts.121.gate_proj.weight": "model-00090-of-000163.safetensors", - "model.layers.35.mlp.experts.121.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.121.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.121.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.121.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.121.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.122.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.122.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.122.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.122.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.123.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.123.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.124.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.124.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.125.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.125.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.126.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.126.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.126.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.126.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.127.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.127.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.128.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.128.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.129.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.129.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.129.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.129.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.130.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.130.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.131.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.131.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.132.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.132.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.133.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.133.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.133.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.133.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.134.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.134.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.135.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.135.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.136.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.136.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.136.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.136.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.137.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.137.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.138.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.138.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.139.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.139.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.140.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.140.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.140.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.140.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.141.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.141.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.142.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.142.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.143.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.143.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.143.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.143.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.144.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.144.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.145.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.145.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.146.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.146.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.147.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.147.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.147.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.147.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.148.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.148.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.149.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.149.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.150.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.150.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.150.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.150.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.151.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.151.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.152.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.152.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.153.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.153.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.154.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.154.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.154.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.154.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.155.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.155.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.156.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.156.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.157.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.157.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.157.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.157.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.158.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.158.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.159.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.159.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.160.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.160.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.161.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.161.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.161.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.161.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.162.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.162.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.163.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.163.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.164.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.164.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.164.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.164.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.165.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.165.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.166.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.166.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.167.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.167.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.168.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.168.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.168.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.168.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.169.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.169.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.170.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.170.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.171.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.171.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.171.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.171.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.172.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.172.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.173.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.173.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.174.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.174.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.175.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.175.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.175.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.175.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.176.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.176.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.177.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.177.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.178.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.178.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.178.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.178.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.179.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.179.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.180.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.180.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.181.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.181.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.182.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.182.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.182.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.182.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.183.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.183.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.184.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.184.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.185.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.185.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.185.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.185.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.186.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.186.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.187.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.187.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.188.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.188.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.189.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.189.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.189.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.189.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.190.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.190.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.191.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.191.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.192.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.192.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.192.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.192.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.193.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.193.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.194.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.194.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.195.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.195.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.196.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.196.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.196.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.196.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.197.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.197.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.198.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.198.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.199.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.199.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.199.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.199.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.200.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.200.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.201.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.201.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.202.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.202.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.203.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.203.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.203.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.203.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.204.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.204.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.205.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.205.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.206.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.206.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.206.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.206.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.207.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.207.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.208.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.208.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.209.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.209.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.210.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.210.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.210.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.210.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.211.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.211.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.212.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.212.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.213.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.213.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.213.down_proj.weight": "model-00091-of-000163.safetensors", - 
"model.layers.35.mlp.experts.213.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.214.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.214.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.215.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.215.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.216.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.216.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.217.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", 
"model.layers.35.mlp.experts.217.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.217.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.217.down_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.gate_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.gate_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.up_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.up_proj.weight_scale_inv": "model-00091-of-000163.safetensors", "model.layers.35.mlp.experts.218.down_proj.weight": "model-00091-of-000163.safetensors", - "model.layers.35.mlp.experts.218.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.219.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.219.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.220.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.220.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.220.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.220.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.221.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.221.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.222.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.222.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.223.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.223.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.224.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.35.mlp.experts.224.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.224.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.224.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.225.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.225.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.226.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.226.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.227.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.227.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.227.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.227.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.228.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.228.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.229.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.229.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.230.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.230.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.231.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.35.mlp.experts.231.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.231.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.231.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.232.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.232.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.233.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.233.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.234.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.234.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.234.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.234.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.235.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.235.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.236.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.236.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.237.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.237.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.238.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.35.mlp.experts.238.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.238.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.238.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.239.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.239.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.240.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.240.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.241.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.241.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.241.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.241.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.242.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.242.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.243.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.243.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.244.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.244.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.245.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.35.mlp.experts.245.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.245.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.245.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.246.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.246.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.247.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.247.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.248.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.248.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.248.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.248.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.249.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.249.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.250.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.250.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.251.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.251.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.252.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.35.mlp.experts.252.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.252.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.252.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.253.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.253.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.254.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.254.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.255.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.35.mlp.experts.255.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.mlp.experts.255.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.35.mlp.experts.255.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.35.input_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.35.post_attention_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_a_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.q_a_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_a_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.q_b_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.q_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_a_proj_with_mqa.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_a_layernorm.weight": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.kv_b_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.kv_b_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.self_attn.o_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.self_attn.o_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.gate.weight": "model-00092-of-000163.safetensors", "model.layers.36.mlp.gate.e_score_correction_bias": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.shared_experts.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.shared_experts.down_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.shared_experts.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.0.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.0.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.1.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.1.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.2.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.2.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.up_proj.weight": 
"model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.3.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.3.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.4.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.4.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.5.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.5.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.6.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.6.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.7.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.7.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.7.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.7.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.8.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.8.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.9.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.9.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.10.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.10.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.11.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.11.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.12.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.12.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.13.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.13.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.14.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.14.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.14.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.14.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.15.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.15.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.16.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.16.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.17.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.17.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.17.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.17.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.18.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.18.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.19.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.19.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.20.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.20.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.21.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.21.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.21.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.21.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.22.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.22.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.23.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.23.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.24.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.24.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.24.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.24.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.25.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.25.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.26.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.26.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.27.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.27.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.28.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.28.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.28.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.28.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.29.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.29.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.30.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.30.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.31.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.31.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.31.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.31.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.32.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.32.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.33.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.33.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.34.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.34.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.35.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.35.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.35.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.35.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.36.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.36.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.37.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.37.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.38.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.38.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.38.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.38.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.39.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.39.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.40.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.40.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.41.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.41.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.42.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.42.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.42.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.42.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.43.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.43.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.44.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.44.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.45.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.45.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.45.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.45.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.46.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.46.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.47.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.47.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.48.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.48.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.gate_proj.weight": "model-00092-of-000163.safetensors", - 
"model.layers.36.mlp.experts.49.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.49.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.49.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.49.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.50.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.50.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.51.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.51.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.52.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.52.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", 
"model.layers.36.mlp.experts.52.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.52.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.53.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.53.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.gate_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.up_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.up_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.54.down_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.54.down_proj.weight_scale_inv": "model-00092-of-000163.safetensors", "model.layers.36.mlp.experts.55.gate_proj.weight": "model-00092-of-000163.safetensors", - "model.layers.36.mlp.experts.55.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.55.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.55.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.55.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.55.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.56.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.56.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.56.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.56.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.57.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.57.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.58.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.58.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.59.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.59.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.59.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.59.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.60.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.60.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.61.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.61.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.62.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.62.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.63.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.63.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.63.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.63.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.64.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.64.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.65.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.65.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.66.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.66.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.66.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.66.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.67.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.67.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.68.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.68.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.69.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.69.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.70.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.70.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.70.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.70.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.71.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.71.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.72.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.72.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.73.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.73.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.73.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.73.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.74.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.74.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.75.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.75.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.76.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.76.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.77.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.77.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.77.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.77.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.78.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.78.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.79.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.79.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.80.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.80.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.80.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.80.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.81.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.81.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.82.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.82.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.83.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.83.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.84.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.84.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.84.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.84.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.85.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.85.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.86.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.86.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.87.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.87.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.87.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.87.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.88.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.88.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.89.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.89.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.90.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.90.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.91.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.91.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.91.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.91.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.92.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.92.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.93.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.93.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.94.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.94.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.94.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.94.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.95.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.95.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.96.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.96.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.97.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.97.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.98.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.98.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.98.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.98.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.99.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.99.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.100.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.100.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.101.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.101.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.101.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.101.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.102.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.102.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.103.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.103.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.104.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.104.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.105.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.105.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.105.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.105.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.106.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.106.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.107.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.107.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.108.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.108.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.108.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.108.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.109.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.109.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.110.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.110.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.111.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.111.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.112.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.112.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.112.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.112.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.113.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.113.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.114.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.114.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.115.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.115.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.115.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.115.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.116.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.116.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.117.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.117.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.118.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.118.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.119.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.119.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.119.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.119.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.120.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.120.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.121.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.121.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.122.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.122.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.122.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.122.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.123.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.123.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.124.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.124.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.125.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.125.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.126.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.126.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.126.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.126.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.127.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.127.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.128.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.128.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.129.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.129.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.129.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.129.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.130.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.130.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.131.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.131.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.132.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.132.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.133.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.133.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.133.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.133.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.134.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.134.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.135.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.135.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.136.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.136.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.136.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.136.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.137.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.137.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.138.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.138.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.139.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.139.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.140.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.140.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.140.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.140.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.141.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.141.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.142.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.142.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.143.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.143.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.143.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.143.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.144.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.144.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.145.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.145.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.146.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.146.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.gate_proj.weight": "model-00093-of-000163.safetensors", - 
"model.layers.36.mlp.experts.147.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.147.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.147.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.147.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.148.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.148.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.149.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.149.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.150.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.150.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", 
"model.layers.36.mlp.experts.150.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.150.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.151.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.151.down_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.gate_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.gate_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.up_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.up_proj.weight_scale_inv": "model-00093-of-000163.safetensors", "model.layers.36.mlp.experts.152.down_proj.weight": "model-00093-of-000163.safetensors", - "model.layers.36.mlp.experts.152.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.153.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.153.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.154.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.154.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.154.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.154.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.155.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.155.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.156.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.156.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.157.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.157.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.157.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.157.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.158.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.158.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.159.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.159.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.160.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.160.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.161.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.161.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.161.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.161.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.162.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.162.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.163.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.163.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.164.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.164.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.164.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.164.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.165.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.165.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.166.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.166.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.167.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.167.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.168.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.168.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.168.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.168.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.169.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.169.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.170.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.170.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.171.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.171.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.171.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.171.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.172.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.172.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.173.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.173.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.174.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.174.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.175.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.175.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.175.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.175.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.176.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.176.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.177.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.177.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.178.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.178.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.178.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.178.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.179.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.179.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.180.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.180.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.181.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.181.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.182.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.182.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.182.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.182.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.183.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.183.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.184.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.184.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.185.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.185.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.185.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.185.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.186.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.186.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.187.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.187.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.188.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.188.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.189.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.189.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.189.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.189.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.190.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.190.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.191.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.191.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.192.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.192.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.192.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.192.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.193.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.193.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.194.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.194.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.195.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.195.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.196.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.196.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.196.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.196.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.197.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.197.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.198.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.198.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.199.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.199.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.199.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.199.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.200.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.200.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.201.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.201.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.202.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.202.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.203.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.203.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.203.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.203.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.204.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.204.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.205.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.205.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.206.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.206.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.206.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.206.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.207.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.207.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.208.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.208.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.209.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.209.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.210.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.210.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.210.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.210.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.211.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.211.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.212.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.212.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.213.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.213.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.213.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.213.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.214.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.214.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.215.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.215.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.216.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.216.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.217.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.217.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.217.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.217.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.218.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.218.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.219.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.219.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.220.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.220.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.220.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.220.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.221.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.221.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.222.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.222.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.223.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.223.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.224.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.224.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.224.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.224.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.225.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.225.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.226.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.226.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.227.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.227.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.227.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.227.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.228.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.228.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.229.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.229.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.230.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.230.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.231.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.231.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.231.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.231.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.232.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.232.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.233.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.233.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.234.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.234.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.234.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.234.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.235.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.235.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.236.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.236.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.237.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.237.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.238.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.238.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.238.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.238.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.239.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.239.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.240.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.240.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.241.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.241.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.241.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.241.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.242.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.242.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.243.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.243.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.244.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.244.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.gate_proj.weight": "model-00094-of-000163.safetensors", - 
"model.layers.36.mlp.experts.245.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.245.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.245.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.245.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.246.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.246.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.247.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.247.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.248.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.248.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", 
"model.layers.36.mlp.experts.248.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.248.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.up_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.249.down_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.249.down_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.250.gate_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.250.gate_proj.weight_scale_inv": "model-00094-of-000163.safetensors", "model.layers.36.mlp.experts.250.up_proj.weight": "model-00094-of-000163.safetensors", - "model.layers.36.mlp.experts.250.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.250.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.250.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.251.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.251.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.gate_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.36.mlp.experts.252.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.252.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.252.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.252.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.253.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.253.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.254.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.254.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.255.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.mlp.experts.255.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.36.mlp.experts.255.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.36.mlp.experts.255.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.36.input_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.36.post_attention_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_a_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.q_a_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_a_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.q_b_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.q_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_a_proj_with_mqa.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_a_layernorm.weight": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.kv_b_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.kv_b_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.self_attn.o_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.self_attn.o_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.gate.weight": "model-00095-of-000163.safetensors", "model.layers.37.mlp.gate.e_score_correction_bias": "model-00095-of-000163.safetensors", "model.layers.37.mlp.shared_experts.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.shared_experts.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.shared_experts.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.shared_experts.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.0.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.0.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.1.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.1.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.2.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.2.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.gate_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.3.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.3.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.3.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.3.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.4.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.4.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.5.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.5.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.6.down_proj.weight": 
"model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.6.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.7.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.7.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.8.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.8.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.9.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.9.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.10.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.10.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.10.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.10.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.11.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.11.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.12.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.12.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.13.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.13.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.13.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.13.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.14.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.14.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.15.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.15.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.16.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.16.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.17.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.17.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.17.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.17.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.18.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.18.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.19.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.19.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.20.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.20.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.20.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.20.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.21.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.21.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.22.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.22.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.23.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.23.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.24.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.24.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.24.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.24.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.25.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.25.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.26.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.26.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.27.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.27.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.27.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.27.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.28.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.28.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.29.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.29.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.30.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.30.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.31.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.31.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.31.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.31.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.32.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.32.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.33.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.33.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.34.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.34.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.34.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.34.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.35.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.35.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.36.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.36.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.37.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.37.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.38.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.38.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.38.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.38.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.39.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.39.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.40.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.40.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.41.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.41.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.41.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.41.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.42.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.42.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.43.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.43.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.44.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.44.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.45.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.45.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.45.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.45.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.46.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.46.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.47.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.47.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.48.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.48.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.48.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.48.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.49.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.49.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.50.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.50.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.51.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.51.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.52.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.52.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.52.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.52.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.53.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.53.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.54.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.54.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.55.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.55.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.55.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.55.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.56.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.56.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.57.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.57.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.58.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.58.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.59.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.59.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.59.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.59.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.60.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.60.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.61.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.61.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.62.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.62.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.62.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.62.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.63.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.63.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.64.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.64.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.65.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.65.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.66.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.66.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.66.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.66.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.67.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.67.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.68.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.68.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.69.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.69.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.69.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.69.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.70.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.70.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.71.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.71.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.72.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.72.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.73.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.73.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.73.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.73.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.74.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.74.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.75.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.75.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.76.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.76.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.76.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.76.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.77.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.77.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.78.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.78.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.79.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.79.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.80.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", 
"model.layers.37.mlp.experts.80.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.80.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.80.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.81.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.81.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.82.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.82.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.83.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.83.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.83.down_proj.weight": "model-00095-of-000163.safetensors", - 
"model.layers.37.mlp.experts.83.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.84.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.84.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.85.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.85.down_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.gate_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.gate_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.up_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.up_proj.weight_scale_inv": "model-00095-of-000163.safetensors", "model.layers.37.mlp.experts.86.down_proj.weight": "model-00095-of-000163.safetensors", - "model.layers.37.mlp.experts.86.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.87.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.87.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.87.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.87.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.88.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.88.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.89.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.89.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.90.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.90.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.90.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.90.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.91.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.91.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.92.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.92.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.93.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.93.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.94.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.94.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.94.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.94.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.95.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.95.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.96.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.96.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.97.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.97.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.97.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.97.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.98.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.98.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.99.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.99.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.100.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.100.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.101.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.101.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.101.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.101.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.102.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.102.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.103.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.103.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.104.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.104.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.104.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.104.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.105.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.105.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.106.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.106.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.107.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.107.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.108.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.108.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.108.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.108.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.109.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.109.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.110.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.110.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.111.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.111.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.111.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.111.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.112.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.112.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.113.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.113.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.114.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.114.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.115.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.115.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.115.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.115.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.116.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.116.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.117.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.117.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.118.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.118.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.118.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.118.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.119.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.119.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.120.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.120.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.121.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.121.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.122.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.122.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.122.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.122.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.123.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.123.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.124.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.124.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.125.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.125.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.125.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.125.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.126.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.126.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.127.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.127.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.128.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.128.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.129.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.129.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.129.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.129.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.130.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.130.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.131.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.131.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.132.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.132.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.132.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.132.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.133.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.133.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.134.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.134.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.135.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.135.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.136.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.136.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.136.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.136.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.137.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.137.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.138.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.138.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.139.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.139.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.139.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.139.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.140.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.140.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.141.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.141.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.142.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.142.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.143.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.143.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.143.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.143.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.144.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.144.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.145.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.145.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.146.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.146.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.146.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.146.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.147.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.147.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.148.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.148.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.149.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.149.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.150.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.150.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.150.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.150.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.151.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.151.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.152.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.152.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.153.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.153.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.153.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.153.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.154.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.154.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.155.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.155.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.156.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.156.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.157.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.157.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.157.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.157.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.158.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.158.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.159.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.159.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.160.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.160.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.160.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.160.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.161.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.161.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.162.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.162.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.163.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.163.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.164.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.164.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.164.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.164.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.165.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.165.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.166.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.166.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.167.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.167.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.167.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.167.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.168.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.168.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.169.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.169.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.170.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.170.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.171.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.171.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.171.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.171.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.172.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.172.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.173.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.173.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.174.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.174.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.174.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.174.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.175.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.175.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.176.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.176.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.177.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.177.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.178.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", 
"model.layers.37.mlp.experts.178.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.178.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.178.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.179.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.179.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.180.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.180.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.181.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.181.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.181.down_proj.weight": "model-00096-of-000163.safetensors", - 
"model.layers.37.mlp.experts.181.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.182.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.182.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.up_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.183.down_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.183.down_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.184.gate_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.184.gate_proj.weight_scale_inv": "model-00096-of-000163.safetensors", "model.layers.37.mlp.experts.184.up_proj.weight": "model-00096-of-000163.safetensors", - "model.layers.37.mlp.experts.184.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.184.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.184.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.185.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.185.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.185.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.185.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.186.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.186.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.187.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.187.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.188.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.188.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.188.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.188.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.189.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.189.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.190.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.190.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.191.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.191.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.192.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.192.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.192.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.192.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.193.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.193.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.194.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.194.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.195.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.195.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.195.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.195.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.196.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.196.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.197.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.197.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.198.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.198.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.199.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.199.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.199.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.199.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.200.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.200.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.201.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.201.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.202.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.202.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.202.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.202.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.203.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.203.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.204.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.204.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.205.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.205.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.206.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.206.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.206.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.206.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.207.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.207.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.208.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.208.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.209.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.209.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.209.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.209.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.210.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.210.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.211.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.211.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.212.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.212.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.213.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.213.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.213.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.213.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.214.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.214.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.215.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.215.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.216.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.216.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.216.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.216.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.217.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.217.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.218.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.218.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.219.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.219.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.220.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.220.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.220.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.220.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.221.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.221.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.222.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.222.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.223.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.223.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.223.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.223.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.224.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.224.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.225.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.225.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.226.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.226.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.227.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.227.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.227.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.227.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.228.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.228.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.229.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.229.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.230.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.230.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.230.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.230.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.231.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.231.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.232.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.232.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.233.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.233.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.234.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.234.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.234.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.234.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.235.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.235.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.236.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.236.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.237.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.237.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.237.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.237.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.238.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.238.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.239.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.239.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.240.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.240.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.241.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.241.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.241.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.241.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.242.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.242.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.243.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.243.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.244.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.244.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.244.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.244.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.245.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.245.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.246.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.246.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.247.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.247.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.248.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.248.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.248.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.248.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.249.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.249.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.250.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.250.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.251.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.251.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.251.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.37.mlp.experts.251.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.252.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.252.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.253.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.253.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.254.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.254.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.255.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.37.mlp.experts.255.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.mlp.experts.255.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.37.mlp.experts.255.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.37.input_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.37.post_attention_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_a_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.q_a_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_a_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.q_b_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.q_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_a_proj_with_mqa.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_a_layernorm.weight": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.kv_b_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.kv_b_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.self_attn.o_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.self_attn.o_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.gate.weight": "model-00097-of-000163.safetensors", "model.layers.38.mlp.gate.e_score_correction_bias": "model-00097-of-000163.safetensors", "model.layers.38.mlp.shared_experts.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.38.mlp.shared_experts.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.shared_experts.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.shared_experts.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.0.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.0.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.1.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.1.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.2.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.2.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.2.down_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.38.mlp.experts.2.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.3.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.3.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.4.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.4.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.5.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.5.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.up_proj.weight": 
"model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.6.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.6.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.7.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.7.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.8.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.8.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.9.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.9.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.38.mlp.experts.10.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.10.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.10.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.10.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.11.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.11.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.12.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.12.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.13.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.up_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.38.mlp.experts.13.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.13.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.13.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.14.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.14.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.15.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.15.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.16.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.16.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", 
"model.layers.38.mlp.experts.17.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.17.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.17.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.17.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.18.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.18.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.up_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.19.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.19.down_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.gate_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.20.gate_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.up_proj.weight": "model-00097-of-000163.safetensors", - 
"model.layers.38.mlp.experts.20.up_proj.weight_scale_inv": "model-00097-of-000163.safetensors", "model.layers.38.mlp.experts.20.down_proj.weight": "model-00097-of-000163.safetensors", - "model.layers.38.mlp.experts.20.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.21.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.21.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.22.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.22.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.23.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.23.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.24.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.24.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.24.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.24.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.25.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.25.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.26.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.26.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.27.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.27.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.27.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.27.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.28.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.28.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.29.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.29.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.30.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.30.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.31.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.31.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.31.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.31.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.32.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.32.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.33.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.33.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.34.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.34.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.34.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.34.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.35.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.35.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.36.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.36.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.37.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.37.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.38.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.38.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.38.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.38.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.39.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.39.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.40.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.40.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.41.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.41.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.41.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.41.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.42.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.42.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.43.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.43.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.44.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.44.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.45.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.45.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.45.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.45.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.46.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.46.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.47.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.47.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.48.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.48.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.48.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.48.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.49.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.49.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.50.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.50.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.51.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.51.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.52.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.52.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.52.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.52.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.53.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.53.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.54.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.54.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.55.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.55.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.55.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.55.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.56.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.56.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.57.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.57.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.58.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.58.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.59.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.59.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.59.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.59.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.60.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.60.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.61.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.61.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.62.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.62.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.62.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.62.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.63.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.63.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.64.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.64.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.65.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.65.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.66.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.66.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.66.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.66.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.67.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.67.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.68.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.68.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.69.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.69.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.69.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.69.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.70.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.70.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.71.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.71.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.72.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.72.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.73.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.73.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.73.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.73.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.74.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.74.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.75.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.75.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.76.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.76.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.76.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.76.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.77.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.77.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.78.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.78.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.79.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.79.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.80.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.80.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.80.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.80.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.81.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.81.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.82.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.82.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.83.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.83.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.83.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.83.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.84.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.84.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.85.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.85.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.86.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.86.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.87.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.87.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.87.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.87.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.88.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.88.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.89.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.89.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.90.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.90.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.90.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.90.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.91.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.91.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.92.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.92.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.93.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.93.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.94.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.94.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.94.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.94.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.95.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.95.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.96.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.96.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.97.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.97.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.97.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.97.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.98.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.98.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.99.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.99.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.100.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.100.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.101.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.101.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.101.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.101.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.102.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.102.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.103.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.103.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.104.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.104.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.104.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.104.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.105.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.105.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.106.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.106.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.107.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.107.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.108.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.108.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.108.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.108.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.109.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.109.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.110.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.110.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.111.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.111.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.111.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.111.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.112.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.112.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.113.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.113.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.114.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.114.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", 
"model.layers.38.mlp.experts.115.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.115.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.115.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.115.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.116.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.116.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.up_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.up_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.117.down_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.117.down_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.118.gate_proj.weight": "model-00098-of-000163.safetensors", - "model.layers.38.mlp.experts.118.gate_proj.weight_scale_inv": "model-00098-of-000163.safetensors", "model.layers.38.mlp.experts.118.up_proj.weight": "model-00098-of-000163.safetensors", - 
"model.layers.38.mlp.experts.118.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.118.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.118.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.119.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.119.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.120.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.120.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.121.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.121.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.122.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.122.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.122.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.122.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.123.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.123.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.124.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.124.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.125.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.125.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.125.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.125.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.126.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.126.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.127.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.127.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.128.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.128.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.129.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.129.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.129.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.129.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.130.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.130.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.131.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.131.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.132.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.132.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.132.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.132.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.133.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.133.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.134.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.134.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.135.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.135.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.136.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.136.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.136.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.136.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.137.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.137.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.138.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.138.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.139.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.139.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.139.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.139.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.140.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.140.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.141.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.141.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.142.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.142.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.143.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.143.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.143.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.143.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.144.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.144.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.145.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.145.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.146.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.146.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.146.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.146.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.147.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.147.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.148.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.148.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.149.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.149.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.150.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.150.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.150.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.150.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.151.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.151.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.152.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.152.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.153.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.153.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.153.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.153.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.154.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.154.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.155.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.155.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.156.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.156.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.157.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.157.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.157.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.157.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.158.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.158.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.159.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.159.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.160.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.160.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.160.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.160.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.161.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.161.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.162.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.162.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.163.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.163.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.164.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.164.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.164.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.164.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.165.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.165.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.166.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.166.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.167.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.167.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.167.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.167.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.168.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.168.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.169.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.169.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.170.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.170.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.171.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.171.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.171.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.171.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.172.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.172.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.173.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.173.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.174.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.174.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.174.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.174.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.175.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.175.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.176.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.176.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.177.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.177.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.178.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.178.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.178.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.178.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.179.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.179.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.180.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.180.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.181.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.181.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.181.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.181.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.182.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.182.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.183.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.183.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.184.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.184.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.185.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.185.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.185.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.185.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.186.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.186.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.187.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.187.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.188.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.188.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.188.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.188.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.189.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.189.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.190.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.190.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.191.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.191.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.192.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.192.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.192.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.192.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.193.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.193.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.194.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.194.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.195.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.195.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.195.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.195.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.196.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.196.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.197.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.197.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.198.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.198.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.199.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.199.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.199.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.199.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.200.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.200.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.201.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.201.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.202.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.202.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.202.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.202.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.203.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.203.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.204.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.204.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.205.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.205.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.206.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.206.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.206.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.206.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.207.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.207.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.208.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.208.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.209.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.up_proj.weight": "model-00099-of-000163.safetensors", - 
"model.layers.38.mlp.experts.209.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.209.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.209.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.210.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.210.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.211.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.211.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.212.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.212.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", 
"model.layers.38.mlp.experts.213.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.213.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.213.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.213.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.214.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.214.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.gate_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.up_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.up_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.215.down_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.215.down_proj.weight_scale_inv": "model-00099-of-000163.safetensors", "model.layers.38.mlp.experts.216.gate_proj.weight": "model-00099-of-000163.safetensors", - "model.layers.38.mlp.experts.216.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.216.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.216.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.216.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.216.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.217.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.217.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.218.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.218.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.219.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.219.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.220.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.220.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.220.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.220.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.221.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.221.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.222.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.222.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.223.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.223.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.223.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.223.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.224.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.224.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.225.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.225.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.226.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.226.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.227.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.227.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.227.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.227.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.228.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.228.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.229.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.229.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.230.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.230.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.230.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.230.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.231.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.231.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.232.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.232.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.233.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.233.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.234.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.234.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.234.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.234.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.235.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.235.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.236.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.236.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.237.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.237.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.237.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.237.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.238.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.238.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.239.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.239.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.240.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.240.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.241.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.241.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.241.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.241.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.242.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.242.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.243.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.243.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.244.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.244.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.244.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.244.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.245.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.245.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.246.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.246.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.247.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.247.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.248.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.248.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.248.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.248.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.249.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.249.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.250.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.250.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.251.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.up_proj.weight": "model-00100-of-000163.safetensors", - 
"model.layers.38.mlp.experts.251.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.251.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.251.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.252.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.252.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.253.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.253.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.254.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.254.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", 
"model.layers.38.mlp.experts.255.gate_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.gate_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.255.up_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.up_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.mlp.experts.255.down_proj.weight": "model-00100-of-000163.safetensors", - "model.layers.38.mlp.experts.255.down_proj.weight_scale_inv": "model-00100-of-000163.safetensors", "model.layers.38.input_layernorm.weight": "model-00100-of-000163.safetensors", "model.layers.38.post_attention_layernorm.weight": "model-00100-of-000163.safetensors", "model.layers.39.self_attn.q_a_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.q_a_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.q_a_layernorm.weight": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.q_b_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.q_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_a_proj_with_mqa.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_a_layernorm.weight": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.kv_b_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.kv_b_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.self_attn.o_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.self_attn.o_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.gate.weight": "model-00101-of-000163.safetensors", "model.layers.39.mlp.gate.e_score_correction_bias": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.shared_experts.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.shared_experts.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.shared_experts.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.shared_experts.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.0.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.0.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.1.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.1.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.2.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.up_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.2.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.2.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.2.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.3.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.3.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.4.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.4.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.5.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.5.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.gate_proj.weight": 
"model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.6.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.6.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.7.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.7.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.8.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.8.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.9.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.9.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.9.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.9.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.10.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.10.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.11.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.11.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.12.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.12.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.13.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.13.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.13.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.13.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.14.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.14.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.15.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.15.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.16.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.16.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.16.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.16.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.17.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.17.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.18.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.18.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.19.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.19.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.20.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.20.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.20.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.20.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.21.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.21.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.22.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.22.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.23.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.23.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.23.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.23.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.24.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.24.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.25.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.25.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.26.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.26.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.27.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.27.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.27.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.27.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.28.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.28.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.29.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.29.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.30.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.30.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.30.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.30.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.31.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.31.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.32.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.32.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.33.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.33.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.34.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.34.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.34.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.34.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.35.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.35.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.36.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.36.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.37.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.37.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.37.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.37.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.38.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.38.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.39.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.39.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.40.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.40.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.41.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.41.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.41.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.41.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.42.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.42.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.43.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.43.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.44.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.44.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.44.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.44.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.45.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.45.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.46.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.46.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.47.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.47.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.48.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.48.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.48.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.48.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.49.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.49.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.50.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.50.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.51.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.51.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.51.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.51.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.52.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.52.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.53.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.53.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.54.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.54.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.55.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.55.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.55.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.55.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.56.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.56.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.57.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.57.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.58.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.58.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.58.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.58.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.59.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.59.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.60.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.60.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.61.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.61.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.62.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.62.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.62.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.62.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.63.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.63.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.64.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.64.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.65.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.65.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.65.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.65.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.66.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.66.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.67.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.67.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.68.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.68.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.69.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.69.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.69.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.69.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.70.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.70.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.71.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.71.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.72.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.72.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.72.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.72.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.73.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.73.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.74.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.74.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.75.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.75.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.76.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.76.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.76.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.76.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.77.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.77.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.78.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.78.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.79.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.79.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.79.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.79.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.80.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.80.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.81.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.81.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.82.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.82.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.83.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.83.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.83.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.83.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.84.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.84.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.85.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.85.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.86.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.86.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", 
"model.layers.39.mlp.experts.86.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.86.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.87.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.87.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.88.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.88.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.89.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.89.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.gate_proj.weight": "model-00101-of-000163.safetensors", - 
"model.layers.39.mlp.experts.90.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.90.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.90.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.90.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.gate_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.up_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.up_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.91.down_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.91.down_proj.weight_scale_inv": "model-00101-of-000163.safetensors", "model.layers.39.mlp.experts.92.gate_proj.weight": "model-00101-of-000163.safetensors", - "model.layers.39.mlp.experts.92.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.92.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.92.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.92.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.92.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.93.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.93.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.93.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.93.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.94.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.94.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.95.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.95.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.96.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.96.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.97.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.97.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.97.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.97.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.98.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.98.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.99.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.99.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.100.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.100.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.100.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.100.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.101.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.101.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.102.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.102.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.103.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.103.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.104.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.104.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.104.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.104.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.105.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.105.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.106.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.106.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.107.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.107.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.107.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.107.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.108.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.108.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.109.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.109.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.110.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.110.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.111.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.111.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.111.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.111.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.112.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.112.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.113.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.113.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.114.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.114.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.114.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.114.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.115.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.115.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.116.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.116.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.117.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.117.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.118.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.118.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.118.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.118.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.119.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.119.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.120.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.120.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.121.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.121.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.121.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.121.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.122.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.122.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.123.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.123.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.124.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.124.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.125.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.125.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.125.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.125.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.126.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.126.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.127.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.127.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.128.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.128.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.128.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.128.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.129.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.129.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.130.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.130.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.131.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.131.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.132.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.132.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.132.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.132.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.133.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.133.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.134.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.134.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.135.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.135.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.135.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.135.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.136.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.136.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.137.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.137.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.138.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.138.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.139.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.139.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.139.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.139.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.140.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.140.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.141.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.141.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.142.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.142.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.142.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.142.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.143.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.143.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.144.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.144.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.145.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.145.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.146.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.146.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.146.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.146.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.147.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.147.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.148.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.148.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.149.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.149.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.149.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.149.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.150.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.150.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.151.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.151.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.152.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.152.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.153.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.153.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.153.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.153.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.154.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.154.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.155.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.155.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.156.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.156.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.156.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.156.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.157.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.157.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.158.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.158.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.159.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.159.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.160.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.160.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.160.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.160.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.161.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.161.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.162.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.162.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.163.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.163.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.163.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.163.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.164.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.164.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.165.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.165.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.166.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.166.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.167.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.167.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.167.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.167.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.168.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.168.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.169.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.169.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.170.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.170.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.170.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.170.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.171.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.171.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.172.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.172.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.173.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.173.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.174.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.174.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.174.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.174.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.175.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.175.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.176.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.176.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.177.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.177.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.177.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.177.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.178.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.178.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.179.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.179.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.180.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.180.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.181.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.181.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.181.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.181.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.182.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.182.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.183.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.183.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.184.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.184.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", 
"model.layers.39.mlp.experts.184.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.184.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.185.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.185.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.186.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.186.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.187.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.187.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.gate_proj.weight": "model-00102-of-000163.safetensors", - 
"model.layers.39.mlp.experts.188.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.188.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.188.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.188.down_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.gate_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.gate_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.up_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.up_proj.weight_scale_inv": "model-00102-of-000163.safetensors", "model.layers.39.mlp.experts.189.down_proj.weight": "model-00102-of-000163.safetensors", - "model.layers.39.mlp.experts.189.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.190.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.190.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.191.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.191.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.191.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.191.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.192.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.192.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.193.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.193.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.194.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.194.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.195.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.195.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.195.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.195.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.196.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.196.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.197.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.197.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.198.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.198.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.198.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.198.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.199.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.199.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.200.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.200.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.201.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.201.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.202.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.202.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.202.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.202.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.203.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.203.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.204.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.204.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.205.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.205.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.205.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.205.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.206.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.206.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.207.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.207.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.208.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.208.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.209.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.209.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.209.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.209.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.210.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.210.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.211.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.211.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.212.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.212.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.212.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.212.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.213.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.213.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.214.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.214.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.215.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.215.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.216.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.216.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.216.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.216.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.217.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.217.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.218.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.218.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.219.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.219.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.219.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.219.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.220.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.220.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.221.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.221.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.222.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.222.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.223.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.223.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.223.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.223.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.224.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.224.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.225.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.225.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.226.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.226.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.226.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.226.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.227.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.227.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.228.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.228.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.229.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.229.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.230.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.230.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.230.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.230.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.231.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.231.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.232.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.232.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.233.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.233.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.233.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.233.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.234.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.234.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.235.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.235.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.236.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.236.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.237.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.237.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.237.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.237.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.238.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.238.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.239.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.239.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.240.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.240.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.240.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.240.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.241.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.241.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.242.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.242.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.243.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.243.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.244.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.244.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.244.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.244.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.245.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.245.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.246.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.246.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.247.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.247.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.247.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.247.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.248.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.248.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.249.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.249.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.250.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.250.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.39.mlp.experts.251.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.251.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.251.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.251.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.252.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.252.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.253.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.253.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.254.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.254.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.39.mlp.experts.254.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.254.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.mlp.experts.255.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.39.mlp.experts.255.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.39.input_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.39.post_attention_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_a_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.q_a_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_a_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.q_b_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.q_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_a_proj_with_mqa.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_a_layernorm.weight": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.kv_b_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.kv_b_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.self_attn.o_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.self_attn.o_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.40.mlp.gate.weight": "model-00103-of-000163.safetensors", "model.layers.40.mlp.gate.e_score_correction_bias": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.shared_experts.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.shared_experts.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.0.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.0.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.1.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.1.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.gate_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.40.mlp.experts.2.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.2.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.2.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.2.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.3.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.3.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.4.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.4.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.5.down_proj.weight": 
"model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.5.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.6.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.6.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.7.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.7.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.8.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.8.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.9.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.40.mlp.experts.9.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.9.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.9.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.10.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.10.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.11.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.11.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.12.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.12.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.12.down_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.40.mlp.experts.12.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.13.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.13.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.14.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.14.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.15.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.15.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.16.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.40.mlp.experts.16.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.16.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.16.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.17.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.17.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.18.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.18.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.19.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.19.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.19.down_proj.weight": "model-00103-of-000163.safetensors", - 
"model.layers.40.mlp.experts.19.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.20.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.20.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.21.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.21.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.22.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.22.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.23.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", 
"model.layers.40.mlp.experts.23.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.23.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.23.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.24.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.24.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.gate_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.up_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.up_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.25.down_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.25.down_proj.weight_scale_inv": "model-00103-of-000163.safetensors", "model.layers.40.mlp.experts.26.gate_proj.weight": "model-00103-of-000163.safetensors", - "model.layers.40.mlp.experts.26.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.26.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.26.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.26.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.26.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.27.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.27.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.28.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.28.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.29.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.29.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.30.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.30.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.30.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.30.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.31.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.31.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.32.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.32.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.33.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.33.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.33.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.33.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.34.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.34.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.35.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.35.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.36.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.36.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.37.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.37.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.37.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.37.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.38.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.38.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.39.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.39.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.40.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.40.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.40.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.40.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.41.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.41.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.42.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.42.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.43.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.43.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.44.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.44.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.44.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.44.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.45.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.45.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.46.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.46.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.47.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.47.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.47.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.47.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.48.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.48.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.49.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.49.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.50.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.50.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.51.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.51.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.51.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.51.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.52.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.52.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.53.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.53.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.54.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.54.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.54.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.54.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.55.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.55.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.56.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.56.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.57.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.57.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.58.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.58.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.58.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.58.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.59.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.59.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.60.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.60.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.61.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.61.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.61.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.61.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.62.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.62.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.63.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.63.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.64.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.64.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.65.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.65.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.65.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.65.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.66.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.66.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.67.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.67.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.68.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.68.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.68.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.68.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.69.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.69.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.70.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.70.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.71.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.71.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.72.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.72.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.72.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.72.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.73.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.73.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.74.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.74.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.75.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.75.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.75.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.75.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.76.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.76.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.77.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.77.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.78.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.78.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.79.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.79.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.79.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.79.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.80.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.80.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.81.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.81.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.82.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.82.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.82.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.82.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.83.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.83.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.84.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.84.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.85.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.85.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.86.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.86.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.86.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.86.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.87.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.87.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.88.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.88.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.89.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.89.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.89.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.89.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.90.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.90.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.91.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.91.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.92.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.92.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.93.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.93.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.93.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.93.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.94.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.94.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.95.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.95.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.96.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.96.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.96.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.96.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.97.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.97.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.98.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.98.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.99.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.99.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.100.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.100.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.100.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.100.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.101.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.101.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.102.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.102.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.103.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.103.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.103.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.103.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.104.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.104.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.105.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.105.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.106.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.106.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.107.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.107.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.107.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.107.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.108.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.108.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.109.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.109.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.110.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.110.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.110.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.110.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.111.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.111.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.112.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.112.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.113.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.113.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.114.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.114.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.114.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.114.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.115.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.115.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.116.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.116.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.117.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.117.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.117.down_proj.weight": "model-00104-of-000163.safetensors", - 
"model.layers.40.mlp.experts.117.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.118.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.118.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.119.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.119.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.120.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.120.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.121.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", 
"model.layers.40.mlp.experts.121.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.121.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.121.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.122.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.122.down_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.gate_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.gate_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.up_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.up_proj.weight_scale_inv": "model-00104-of-000163.safetensors", "model.layers.40.mlp.experts.123.down_proj.weight": "model-00104-of-000163.safetensors", - "model.layers.40.mlp.experts.123.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.124.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.124.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.124.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.124.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.125.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.125.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.126.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.126.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.127.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.127.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.128.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.128.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.128.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.128.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.129.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.129.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.130.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.130.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.131.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.131.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.131.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.131.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.132.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.132.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.133.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.133.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.134.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.134.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.135.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.135.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.135.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.135.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.136.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.136.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.137.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.137.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.138.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.138.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.138.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.138.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.139.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.139.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.140.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.140.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.141.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.141.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.142.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.142.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.142.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.142.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.143.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.143.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.144.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.144.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.145.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.145.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.145.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.145.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.146.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.146.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.147.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.147.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.148.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.148.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.149.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.149.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.149.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.149.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.150.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.150.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.151.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.151.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.152.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.152.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.152.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.152.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.153.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.153.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.154.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.154.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.155.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.155.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.156.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.156.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.156.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.156.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.157.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.157.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.158.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.158.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.159.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.159.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.159.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.159.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.160.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.160.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.161.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.161.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.162.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.162.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.163.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.163.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.163.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.163.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.164.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.164.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.165.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.165.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.166.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.166.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.166.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.166.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.167.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.167.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.168.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.168.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.169.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.169.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.170.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.170.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.170.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.170.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.171.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.171.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.172.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.172.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.173.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.173.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.173.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.173.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.174.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.174.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.175.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.175.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.176.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.176.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.177.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.177.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.177.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.177.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.178.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.178.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.179.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.179.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.180.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.180.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.180.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.180.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.181.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.181.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.182.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.182.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.183.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.183.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.184.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.184.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.184.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.184.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.185.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.185.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.186.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.186.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.187.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.187.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.187.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.187.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.188.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.188.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.189.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.189.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.190.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.190.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.191.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.191.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.191.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.191.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.192.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.192.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.193.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.193.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.194.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.194.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.194.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.194.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.195.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.195.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.196.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.196.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.197.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.197.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.198.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.198.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.198.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.198.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.199.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.199.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.200.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.200.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.201.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.201.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.201.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.201.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.202.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.202.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.203.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.203.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.204.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.204.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.205.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.205.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.205.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.205.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.206.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.206.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.207.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.207.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.208.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.208.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.208.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.208.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.209.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.209.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.210.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.210.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.211.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.211.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.212.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.212.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.212.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.212.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.213.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.213.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.214.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.214.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.215.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.215.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.215.down_proj.weight": "model-00105-of-000163.safetensors", - 
"model.layers.40.mlp.experts.215.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.216.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.216.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.217.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.217.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.218.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.218.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.219.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", 
"model.layers.40.mlp.experts.219.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.219.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.219.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.up_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.220.down_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.220.down_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.221.gate_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.221.gate_proj.weight_scale_inv": "model-00105-of-000163.safetensors", "model.layers.40.mlp.experts.221.up_proj.weight": "model-00105-of-000163.safetensors", - "model.layers.40.mlp.experts.221.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.221.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.221.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.222.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.222.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.222.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.40.mlp.experts.222.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.223.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.223.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.224.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.224.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.225.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.225.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.226.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.40.mlp.experts.226.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.226.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.226.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.227.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.227.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.228.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.228.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.229.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.229.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.229.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.40.mlp.experts.229.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.230.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.230.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.231.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.231.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.232.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.232.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.233.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.40.mlp.experts.233.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.233.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.233.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.234.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.234.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.235.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.235.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.236.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.236.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.236.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.40.mlp.experts.236.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.237.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.237.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.238.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.238.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.239.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.239.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.240.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.40.mlp.experts.240.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.240.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.240.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.241.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.241.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.242.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.242.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.243.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.243.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.243.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.40.mlp.experts.243.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.244.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.244.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.245.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.245.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.246.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.246.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.247.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.40.mlp.experts.247.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.247.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.247.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.248.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.248.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.249.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.249.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.250.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.250.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.250.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.40.mlp.experts.250.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.251.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.251.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.252.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.252.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.253.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.253.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.254.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.40.mlp.experts.254.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.254.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.254.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.mlp.experts.255.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.40.mlp.experts.255.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.40.input_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.40.post_attention_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_a_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.q_a_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_a_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.q_b_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.q_b_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_a_proj_with_mqa.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_a_layernorm.weight": "model-00106-of-000163.safetensors", "model.layers.41.self_attn.kv_b_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.kv_b_proj.weight_scale_inv": 
"model-00106-of-000163.safetensors", "model.layers.41.self_attn.o_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.self_attn.o_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.gate.weight": "model-00106-of-000163.safetensors", "model.layers.41.mlp.gate.e_score_correction_bias": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.shared_experts.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.shared_experts.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.0.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.0.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.1.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.1.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.1.down_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.1.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.2.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.2.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.3.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.3.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.4.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.4.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.up_proj.weight": 
"model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.5.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.5.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.6.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.6.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.7.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.7.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.8.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.8.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.9.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.9.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.9.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.9.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.10.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.10.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.11.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.11.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.12.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.12.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.12.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.12.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.13.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.13.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.14.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.14.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.15.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.15.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.16.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.16.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.16.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.16.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.17.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.17.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.18.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.18.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.19.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.19.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.19.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.19.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.20.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.20.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.21.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.21.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.22.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.22.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.23.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.23.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.23.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.23.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.24.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.24.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.25.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.25.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.26.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.26.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.26.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.26.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.27.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.27.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.28.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.28.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.29.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.29.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.30.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.30.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.30.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.30.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.31.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.31.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.32.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.32.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.33.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.33.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.33.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.33.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.34.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.34.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.35.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.35.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.36.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.36.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.37.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.37.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.37.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.37.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.38.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.38.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.39.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.39.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.40.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.40.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.40.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.40.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.41.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.41.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.42.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.42.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.43.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.43.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.44.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.44.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.44.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.44.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.45.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.45.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.46.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.46.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.47.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.47.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.47.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.47.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.48.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.48.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.49.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.49.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.50.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.50.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", 
"model.layers.41.mlp.experts.51.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.51.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.51.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.51.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.52.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.52.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.53.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.53.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.54.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.up_proj.weight": "model-00106-of-000163.safetensors", - 
"model.layers.41.mlp.experts.54.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.54.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.54.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.55.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.55.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.56.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.56.down_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.gate_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.gate_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.up_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.up_proj.weight_scale_inv": "model-00106-of-000163.safetensors", "model.layers.41.mlp.experts.57.down_proj.weight": "model-00106-of-000163.safetensors", - "model.layers.41.mlp.experts.57.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.58.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.58.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.58.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.58.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.59.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.59.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.60.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.60.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.61.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.61.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.61.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.61.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.62.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.62.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.63.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.63.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.64.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.64.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.65.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.65.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.65.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.65.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.66.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.66.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.67.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.67.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.68.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.68.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.68.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.68.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.69.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.69.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.70.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.70.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.71.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.71.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.72.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.72.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.72.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.72.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.73.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.73.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.74.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.74.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.75.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.75.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.75.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.75.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.76.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.76.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.77.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.77.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.78.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.78.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.79.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.79.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.79.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.79.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.80.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.80.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.81.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.81.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.82.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.82.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.82.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.82.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.83.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.83.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.84.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.84.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.85.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.85.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.86.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.86.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.86.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.86.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.87.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.87.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.88.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.88.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.89.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.89.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.89.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.89.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.90.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.90.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.91.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.91.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.92.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.92.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.93.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.93.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.93.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.93.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.94.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.94.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.95.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.95.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.96.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.96.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.96.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.96.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.97.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.97.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.98.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.98.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.99.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.99.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.100.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.100.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.100.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.100.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.101.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.101.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.102.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.102.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.103.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.103.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.103.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.103.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.104.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.104.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.105.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.105.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.106.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.106.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.107.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.107.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.107.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.107.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.108.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.108.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.109.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.109.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.110.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.110.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.110.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.110.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.111.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.111.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.112.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.112.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.113.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.113.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.114.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.114.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.114.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.114.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.115.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.115.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.116.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.116.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.117.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.117.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.117.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.117.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.118.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.118.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.119.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.119.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.120.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.120.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.121.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.121.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.121.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.121.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.122.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.122.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.123.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.123.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.124.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.124.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.124.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.124.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.125.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.125.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.126.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.126.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.127.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.127.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.128.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.128.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.128.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.128.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.129.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.129.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.130.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.130.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.131.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.131.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.131.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.131.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.132.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.132.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.133.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.133.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.134.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.134.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.135.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.135.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.135.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.135.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.136.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.136.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.137.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.137.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.138.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.138.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.138.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.138.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.139.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.139.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.140.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.140.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.141.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.141.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.142.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.142.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.142.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.142.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.143.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.143.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.144.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.144.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.145.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.145.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.145.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.145.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.146.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.146.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.147.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.147.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.148.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.148.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", 
"model.layers.41.mlp.experts.149.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.149.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.149.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.149.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.150.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.150.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.151.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.151.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.152.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.up_proj.weight": "model-00107-of-000163.safetensors", - 
"model.layers.41.mlp.experts.152.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.152.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.152.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.153.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.153.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.up_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.154.down_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.154.down_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.155.gate_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.155.gate_proj.weight_scale_inv": "model-00107-of-000163.safetensors", "model.layers.41.mlp.experts.155.up_proj.weight": "model-00107-of-000163.safetensors", - "model.layers.41.mlp.experts.155.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.155.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.155.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.156.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.156.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.156.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.156.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.157.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.157.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.158.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.158.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.159.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.159.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.159.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.159.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.160.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.160.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.161.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.161.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.162.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.162.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.163.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.163.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.163.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.163.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.164.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.164.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.165.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.165.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.166.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.166.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.166.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.166.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.167.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.167.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.168.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.168.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.169.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.169.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.170.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.170.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.170.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.170.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.171.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.171.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.172.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.172.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.173.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.173.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.173.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.173.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.174.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.174.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.175.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.175.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.176.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.176.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.177.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.177.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.177.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.177.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.178.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.178.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.179.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.179.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.180.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.180.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.180.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.180.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.181.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.181.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.182.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.182.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.183.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.183.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.184.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.184.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.184.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.184.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.185.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.185.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.186.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.186.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.187.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.187.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.187.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.187.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.188.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.188.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.189.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.189.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.190.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.190.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.191.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.191.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.191.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.191.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.192.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.192.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.193.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.193.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.194.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.194.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.194.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.194.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.195.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.195.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.196.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.196.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.197.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.197.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.198.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.198.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.198.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.198.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.199.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.199.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.200.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.200.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.201.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.201.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.201.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.201.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.202.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.202.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.203.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.203.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.204.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.204.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.205.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.205.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.205.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.205.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.206.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.206.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.207.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.207.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.208.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.208.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.208.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.208.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.209.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.209.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.210.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.210.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.211.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.211.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.212.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.212.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.212.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.212.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.213.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.213.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.214.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.214.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.215.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.215.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.215.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.215.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.216.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.216.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.217.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.217.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.218.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.218.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.219.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.219.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.219.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.219.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.220.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.220.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.221.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.221.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.222.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.222.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.222.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.222.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.223.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.223.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.224.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.224.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.225.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.225.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.226.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.226.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.226.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.226.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.227.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.227.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.228.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.228.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.229.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.229.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.229.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.229.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.230.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.230.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.231.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.231.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.232.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.232.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.233.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.233.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.233.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.233.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.234.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.234.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.235.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.235.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.236.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.236.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.236.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.236.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.237.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.237.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.238.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.238.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.239.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.239.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.240.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.240.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.240.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.240.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.241.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.241.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.242.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.242.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.243.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.243.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.243.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.243.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.244.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.244.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.245.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.245.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.246.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.246.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", 
"model.layers.41.mlp.experts.247.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.247.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.247.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.247.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.248.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.248.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.249.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.249.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.250.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.up_proj.weight": "model-00108-of-000163.safetensors", - 
"model.layers.41.mlp.experts.250.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.250.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.250.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.251.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.251.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.gate_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.up_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.up_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.252.down_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.252.down_proj.weight_scale_inv": "model-00108-of-000163.safetensors", "model.layers.41.mlp.experts.253.gate_proj.weight": "model-00108-of-000163.safetensors", - "model.layers.41.mlp.experts.253.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.253.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.253.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.253.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.253.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.41.mlp.experts.254.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.254.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.254.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.254.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.mlp.experts.255.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.41.mlp.experts.255.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.41.input_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.41.post_attention_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_a_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.q_a_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_a_layernorm.weight": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.q_b_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.q_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_a_proj_with_mqa.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_a_layernorm.weight": 
"model-00109-of-000163.safetensors", "model.layers.42.self_attn.kv_b_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.kv_b_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.self_attn.o_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.self_attn.o_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.gate.weight": "model-00109-of-000163.safetensors", "model.layers.42.mlp.gate.e_score_correction_bias": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.shared_experts.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.shared_experts.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.0.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.0.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.1.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.up_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.1.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.1.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.1.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.2.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.2.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.3.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.3.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.4.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.4.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.gate_proj.weight": 
"model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.5.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.5.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.6.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.6.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.7.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.7.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.8.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.8.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.8.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.8.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.9.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.9.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.10.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.10.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.11.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.11.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.12.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.12.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.12.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.12.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.13.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.13.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.14.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.14.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.15.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.15.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.15.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.15.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.16.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.16.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.17.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.17.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.18.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.18.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.19.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.19.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.19.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.19.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.20.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.20.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.21.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.21.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.22.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.22.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.22.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.22.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.23.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.23.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.24.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.24.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.25.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.25.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.26.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.26.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.26.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.26.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.27.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.27.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.28.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.28.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.29.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.29.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.29.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.29.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.30.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.30.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.31.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.31.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.32.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.32.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.33.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.33.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.33.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.33.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.34.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.34.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.35.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.35.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.36.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.36.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.36.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.36.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.37.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.37.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.38.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.38.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.39.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.39.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.40.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.40.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.40.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.40.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.41.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.41.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.42.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.42.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.43.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.43.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.43.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.43.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.44.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.44.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.45.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.45.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.46.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.46.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.47.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.47.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.47.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.47.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.48.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.48.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.49.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.49.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.50.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.50.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.50.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.50.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.51.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.51.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.52.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.52.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.53.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.53.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.54.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.54.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.54.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.54.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.55.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.55.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.56.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.56.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.57.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.57.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.57.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.57.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.58.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.58.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.59.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.59.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.60.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.60.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.61.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.61.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.61.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.61.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.62.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.62.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.63.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.63.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.64.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.64.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.64.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.64.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.65.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.65.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.66.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.66.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.67.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.67.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.68.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.68.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.68.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.68.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.69.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.69.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.70.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.70.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.71.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.71.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.71.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.71.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.72.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.72.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.73.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.73.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.74.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.74.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.75.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.75.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.75.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.75.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.76.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.76.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.77.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.77.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.78.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.78.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.78.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.78.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.79.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.79.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.80.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.80.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.81.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.81.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.82.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.82.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.82.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.82.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.83.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.83.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.84.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.84.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.85.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.85.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", 
"model.layers.42.mlp.experts.85.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.85.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.86.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.86.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.87.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.87.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.gate_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.up_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.88.down_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.88.down_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.89.gate_proj.weight": "model-00109-of-000163.safetensors", - 
"model.layers.42.mlp.experts.89.gate_proj.weight_scale_inv": "model-00109-of-000163.safetensors", "model.layers.42.mlp.experts.89.up_proj.weight": "model-00109-of-000163.safetensors", - "model.layers.42.mlp.experts.89.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.89.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.89.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.90.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.90.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.91.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.91.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.92.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.92.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.92.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.92.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.93.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.93.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.94.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.94.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.95.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.95.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.96.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.96.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.96.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.96.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.97.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.97.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.98.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.98.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.99.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.99.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.99.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.99.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.100.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.100.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.101.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.101.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.102.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.102.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.103.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.103.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.103.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.103.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.104.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.104.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.105.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.105.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.106.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.106.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.106.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.106.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.107.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.107.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.108.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.108.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.109.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.109.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.110.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.110.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.110.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.110.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.111.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.111.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.112.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.112.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.113.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.113.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.113.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.113.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.114.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.114.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.115.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.115.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.116.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.116.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.117.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.117.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.117.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.117.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.118.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.118.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.119.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.119.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.120.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.120.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.120.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.120.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.121.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.121.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.122.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.122.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.123.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.123.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.124.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.124.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.124.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.124.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.125.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.125.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.126.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.126.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.127.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.127.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.127.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.127.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.128.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.128.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.129.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.129.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.130.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.130.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.131.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.131.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.131.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.131.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.132.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.132.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.133.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.133.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.134.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.134.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.134.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.134.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.135.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.135.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.136.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.136.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.137.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.137.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.138.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.138.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.138.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.138.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.139.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.139.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.140.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.140.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.141.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.141.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.141.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.141.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.142.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.142.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.143.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.143.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.144.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.144.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.145.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.145.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.145.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.145.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.146.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.146.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.147.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.147.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.148.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.148.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.148.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.148.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.149.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.149.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.150.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.150.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.151.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.151.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.152.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.152.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.152.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.152.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.153.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.153.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.154.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.154.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.155.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.155.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.155.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.155.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.156.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.156.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.157.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.157.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.158.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.158.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.159.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.159.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.159.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.159.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.160.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.160.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.161.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.161.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.162.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.162.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.162.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.162.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.163.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.163.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.164.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.164.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.165.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.165.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.166.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.166.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.166.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.166.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.167.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.167.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.168.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.168.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.169.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.169.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.169.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.169.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.170.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.170.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.171.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.171.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.172.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.172.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.173.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.173.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.173.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.173.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.174.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.174.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.175.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.175.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.176.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.176.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.176.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.176.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.177.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.177.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.178.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.178.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.179.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.179.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.180.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.180.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.180.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.180.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.181.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.181.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.182.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.182.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.183.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.183.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", 
"model.layers.42.mlp.experts.183.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.183.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.184.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.184.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.185.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.185.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.gate_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.gate_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.up_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.up_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.186.down_proj.weight": "model-00110-of-000163.safetensors", - "model.layers.42.mlp.experts.186.down_proj.weight_scale_inv": "model-00110-of-000163.safetensors", "model.layers.42.mlp.experts.187.gate_proj.weight": "model-00110-of-000163.safetensors", - 
"model.layers.42.mlp.experts.187.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.187.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.187.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.187.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.187.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.188.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.188.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.189.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.189.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.190.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.190.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.190.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.190.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.191.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.191.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.192.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.192.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.193.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.193.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.194.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.194.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.194.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.194.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.195.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.195.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.196.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.196.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.197.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.197.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.197.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.197.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.198.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.198.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.199.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.199.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.200.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.200.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.201.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.201.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.201.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.201.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.202.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.202.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.203.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.203.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.204.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.204.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.204.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.204.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.205.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.205.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.206.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.206.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.207.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.207.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.208.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.208.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.208.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.208.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.209.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.209.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.210.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.210.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.211.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.211.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.211.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.211.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.212.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.212.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.213.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.213.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.214.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.214.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.215.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.215.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.215.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.215.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.216.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.216.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.217.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.217.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.218.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.218.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.218.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.218.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.219.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.219.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.220.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.220.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.221.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.221.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.222.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.222.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.222.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.222.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.223.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.223.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.224.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.224.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.225.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.225.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.225.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.225.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.226.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.226.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.227.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.227.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.228.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.228.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.229.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.229.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.229.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.229.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.230.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.230.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.231.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.231.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.232.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.232.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.232.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.232.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.233.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.233.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.234.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.234.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.235.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.235.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.236.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.236.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.236.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.236.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.237.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.237.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.238.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.238.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.239.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.239.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.239.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.239.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.240.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.240.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.241.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.241.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.242.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.242.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.243.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.243.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.243.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.243.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.244.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.244.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.245.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.245.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.246.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.246.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.246.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.246.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.247.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.247.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.248.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.248.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.249.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.249.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.42.mlp.experts.250.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.250.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.250.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.250.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.251.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.251.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.252.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.252.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.253.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.253.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.42.mlp.experts.253.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.253.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.254.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.254.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.mlp.experts.255.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.42.mlp.experts.255.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.42.input_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.42.post_attention_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_a_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.q_a_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_a_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.q_b_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.q_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_a_proj_with_mqa.weight": 
"model-00111-of-000163.safetensors", - "model.layers.43.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_a_layernorm.weight": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.kv_b_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.kv_b_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.self_attn.o_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.self_attn.o_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.gate.weight": "model-00111-of-000163.safetensors", "model.layers.43.mlp.gate.e_score_correction_bias": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.shared_experts.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.shared_experts.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.0.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.0.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.gate_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.43.mlp.experts.1.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.1.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.1.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.1.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.2.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.2.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.3.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.3.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.4.down_proj.weight": 
"model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.4.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.5.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.5.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.6.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.6.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.7.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.7.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.8.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.43.mlp.experts.8.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.8.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.8.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.9.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.9.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.10.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.10.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.11.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.11.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.11.down_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.43.mlp.experts.11.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.12.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.12.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.13.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.13.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.14.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.14.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.15.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.43.mlp.experts.15.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.15.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.15.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.16.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.16.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.17.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.17.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.18.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.18.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.18.down_proj.weight": "model-00111-of-000163.safetensors", - 
"model.layers.43.mlp.experts.18.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.19.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.19.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.20.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.20.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.21.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.21.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.22.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", 
"model.layers.43.mlp.experts.22.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.up_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.22.down_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.22.down_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.23.gate_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.23.gate_proj.weight_scale_inv": "model-00111-of-000163.safetensors", "model.layers.43.mlp.experts.23.up_proj.weight": "model-00111-of-000163.safetensors", - "model.layers.43.mlp.experts.23.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.23.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.23.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.24.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.24.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.25.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.25.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.25.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.25.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.26.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.26.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.27.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.27.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.28.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.28.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.29.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.29.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.29.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.29.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.30.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.30.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.31.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.31.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.32.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.32.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.32.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.32.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.33.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.33.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.34.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.34.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.35.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.35.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.36.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.36.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.36.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.36.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.37.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.37.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.38.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.38.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.39.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.39.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.39.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.39.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.40.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.40.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.41.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.41.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.42.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.42.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.43.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.43.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.43.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.43.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.44.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.44.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.45.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.45.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.46.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.46.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.46.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.46.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.47.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.47.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.48.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.48.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.49.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.49.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.50.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.50.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.50.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.50.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.51.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.51.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.52.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.52.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.53.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.53.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.53.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.53.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.54.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.54.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.55.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.55.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.56.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.56.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.57.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.57.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.57.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.57.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.58.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.58.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.59.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.59.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.60.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.60.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.60.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.60.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.61.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.61.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.62.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.62.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.63.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.63.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.64.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.64.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.64.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.64.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.65.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.65.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.66.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.66.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.67.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.67.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.67.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.67.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.68.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.68.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.69.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.69.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.70.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.70.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.71.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.71.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.71.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.71.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.72.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.72.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.73.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.73.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.74.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.74.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.74.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.74.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.75.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.75.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.76.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.76.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.77.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.77.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.78.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.78.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.78.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.78.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.79.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.79.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.80.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.80.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.81.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.81.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.81.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.81.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.82.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.82.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.83.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.83.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.84.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.84.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.85.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.85.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.85.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.85.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.86.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.86.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.87.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.87.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.88.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.88.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.88.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.88.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.89.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.89.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.90.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.90.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.91.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.91.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.92.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.92.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.92.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.92.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.93.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.93.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.94.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.94.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.95.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.95.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.95.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.95.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.96.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.96.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.97.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.97.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.98.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.98.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.99.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.99.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.99.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.99.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.100.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.100.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.101.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.101.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.102.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.102.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.102.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.102.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.103.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.103.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.104.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.104.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.105.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.105.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.106.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.106.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.106.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.106.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.107.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.107.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.108.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.108.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.109.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.109.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.109.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.109.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.110.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.110.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.111.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.111.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.112.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.112.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.113.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.113.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.113.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.113.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.114.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.114.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.115.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.115.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.116.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.116.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.116.down_proj.weight": "model-00112-of-000163.safetensors", - 
"model.layers.43.mlp.experts.116.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.117.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.117.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.118.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.118.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.119.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.119.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.120.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.gate_proj.weight_scale_inv": "model-00112-of-000163.safetensors", 
"model.layers.43.mlp.experts.120.up_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.up_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.120.down_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.120.down_proj.weight_scale_inv": "model-00112-of-000163.safetensors", "model.layers.43.mlp.experts.121.gate_proj.weight": "model-00112-of-000163.safetensors", - "model.layers.43.mlp.experts.121.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.121.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.121.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.121.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.121.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.122.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.122.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.123.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.123.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.123.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.123.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.124.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.124.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.125.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.125.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.126.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.126.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.127.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.127.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.127.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.127.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.128.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.128.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.129.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.129.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.130.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.130.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.130.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.130.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.131.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.131.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.132.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.132.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.133.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.133.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.134.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.134.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.134.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.134.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.135.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.135.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.136.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.136.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.137.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.137.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.137.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.137.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.138.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.138.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.139.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.139.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.140.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.140.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.141.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.141.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.141.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.141.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.142.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.142.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.143.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.143.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.144.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.144.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.144.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.144.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.145.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.145.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.146.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.146.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.147.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.147.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.148.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.148.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.148.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.148.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.149.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.149.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.150.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.150.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.151.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.151.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.151.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.151.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.152.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.152.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.153.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.153.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.154.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.154.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.155.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.155.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.155.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.155.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.156.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.156.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.157.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.157.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.158.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.158.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.158.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.158.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.159.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.159.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.160.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.160.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.161.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.161.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.162.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.162.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.162.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.162.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.163.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.163.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.164.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.164.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.165.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.165.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.165.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.165.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.166.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.166.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.167.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.167.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.168.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.168.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.169.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.169.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.169.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.169.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.170.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.170.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.171.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.171.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.172.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.172.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.172.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.172.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.173.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.173.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.174.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.174.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.175.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.175.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.176.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.176.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.176.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.176.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.177.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.177.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.178.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.178.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.179.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.179.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.179.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.179.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.180.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.180.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.181.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.181.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.182.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.182.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.183.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.183.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.183.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.183.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.184.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.184.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.185.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.185.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.186.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.186.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.186.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.186.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.187.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.187.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.188.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.188.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.189.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.189.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.190.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.190.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.190.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.190.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.191.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.191.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.192.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.192.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.193.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.193.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.193.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.193.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.194.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.194.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.195.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.195.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.196.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.196.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.197.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.197.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.197.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.197.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.198.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.198.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.199.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.199.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.200.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.200.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.200.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.200.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.201.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.201.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.202.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.202.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.203.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.203.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.204.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.204.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.204.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.204.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.205.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.205.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.206.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.206.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.207.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.207.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.207.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.207.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.208.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.208.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.209.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.209.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.210.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.210.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.211.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.211.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.211.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.211.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.212.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.212.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.213.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.213.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.214.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.214.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.214.down_proj.weight": "model-00113-of-000163.safetensors", - 
"model.layers.43.mlp.experts.214.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.215.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.215.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.216.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.216.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.217.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.217.down_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.218.gate_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.gate_proj.weight_scale_inv": "model-00113-of-000163.safetensors", 
"model.layers.43.mlp.experts.218.up_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.up_proj.weight_scale_inv": "model-00113-of-000163.safetensors", "model.layers.43.mlp.experts.218.down_proj.weight": "model-00113-of-000163.safetensors", - "model.layers.43.mlp.experts.218.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.219.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.219.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.220.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.220.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.221.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.221.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.221.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.43.mlp.experts.221.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.222.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.222.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.223.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.223.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.224.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.224.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.225.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.43.mlp.experts.225.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.225.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.225.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.226.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.226.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.227.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.227.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.228.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.228.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.228.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.43.mlp.experts.228.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.229.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.229.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.230.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.230.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.231.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.231.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.232.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.43.mlp.experts.232.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.232.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.232.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.233.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.233.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.234.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.234.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.235.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.235.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.235.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.43.mlp.experts.235.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.236.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.236.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.237.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.237.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.238.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.238.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.239.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.43.mlp.experts.239.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.239.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.239.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.240.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.240.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.241.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.241.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.242.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.242.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.242.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.43.mlp.experts.242.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.243.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.243.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.244.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.244.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.245.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.245.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.246.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.43.mlp.experts.246.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.246.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.246.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.247.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.247.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.248.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.248.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.249.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.249.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.249.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.43.mlp.experts.249.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.250.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.250.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.251.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.251.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.252.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.252.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.253.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.43.mlp.experts.253.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.253.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.253.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.254.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.254.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.mlp.experts.255.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.43.mlp.experts.255.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.43.input_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.43.post_attention_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_a_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.q_a_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_a_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.q_b_proj.weight": 
"model-00114-of-000163.safetensors", - "model.layers.44.self_attn.q_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_a_proj_with_mqa.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_a_layernorm.weight": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.kv_b_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.kv_b_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.self_attn.o_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.self_attn.o_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.gate.weight": "model-00114-of-000163.safetensors", "model.layers.44.mlp.gate.e_score_correction_bias": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.shared_experts.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.shared_experts.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.0.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.0.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.0.down_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.0.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.1.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.1.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.2.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.2.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.3.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.3.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.up_proj.weight": 
"model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.4.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.4.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.5.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.5.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.6.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.6.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.7.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.7.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.8.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.8.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.8.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.8.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.9.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.9.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.10.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.10.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.11.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.11.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.11.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.11.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.12.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.12.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.13.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.13.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.14.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.14.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.15.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.15.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.15.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.15.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.16.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.16.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.17.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.17.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.18.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.18.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.18.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.18.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.19.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.19.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.20.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.20.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.21.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.21.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.22.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.22.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.22.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.22.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.23.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.23.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.24.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.24.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.25.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.25.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.25.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.25.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.26.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.26.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.27.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.27.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.28.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.28.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.29.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.29.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.29.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.29.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.30.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.30.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.31.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.31.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.32.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.32.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.32.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.32.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.33.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.33.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.34.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.34.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.35.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.35.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.36.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.36.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.36.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.36.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.37.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.37.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.38.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.38.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.39.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.39.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.39.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.39.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.40.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.40.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.41.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.41.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.42.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.42.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.43.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.43.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.43.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.43.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.44.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.44.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.45.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.45.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.46.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.46.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.46.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.46.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.47.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.47.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.48.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.48.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.49.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.49.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", 
"model.layers.44.mlp.experts.50.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.50.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.50.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.50.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.51.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.51.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.52.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.52.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.53.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.up_proj.weight": "model-00114-of-000163.safetensors", - 
"model.layers.44.mlp.experts.53.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.53.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.53.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.gate_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.up_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.up_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.54.down_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.54.down_proj.weight_scale_inv": "model-00114-of-000163.safetensors", "model.layers.44.mlp.experts.55.gate_proj.weight": "model-00114-of-000163.safetensors", - "model.layers.44.mlp.experts.55.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.55.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.55.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.55.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.55.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.56.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.56.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.57.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.57.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.57.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.57.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.58.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.58.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.59.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.59.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.60.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.60.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.60.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.60.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.61.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.61.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.62.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.62.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.63.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.63.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.64.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.64.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.64.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.64.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.65.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.65.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.66.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.66.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.67.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.67.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.67.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.67.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.68.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.68.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.69.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.69.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.70.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.70.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.71.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.71.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.71.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.71.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.72.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.72.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.73.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.73.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.74.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.74.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.74.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.74.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.75.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.75.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.76.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.76.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.77.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.77.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.78.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.78.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.78.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.78.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.79.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.79.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.80.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.80.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.81.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.81.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.81.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.81.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.82.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.82.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.83.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.83.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.84.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.84.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.85.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.85.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.85.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.85.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.86.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.86.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.87.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.87.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.88.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.88.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.88.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.88.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.89.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.89.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.90.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.90.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.91.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.91.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.92.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.92.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.92.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.92.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.93.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.93.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.94.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.94.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.95.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.95.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.95.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.95.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.96.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.96.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.97.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.97.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.98.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.98.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.99.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.99.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.99.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.99.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.100.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.100.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.101.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.101.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.102.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.102.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.102.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.102.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.103.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.103.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.104.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.104.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.105.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.105.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.106.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.106.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.106.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.106.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.107.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.107.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.108.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.108.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.109.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.109.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.109.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.109.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.110.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.110.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.111.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.111.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.112.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.112.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.113.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.113.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.113.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.113.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.114.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.114.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.115.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.115.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.116.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.116.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.116.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.116.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.117.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.117.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.118.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.118.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.119.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.119.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.120.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.120.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.120.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.120.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.121.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.121.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.122.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.122.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.123.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.123.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.123.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.123.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.124.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.124.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.125.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.125.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.126.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.126.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.127.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.127.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.127.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.127.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.128.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.128.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.129.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.129.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.130.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.130.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.130.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.130.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.131.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.131.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.132.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.132.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.133.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.133.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.134.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.134.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.134.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.134.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.135.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.135.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.136.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.136.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.137.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.137.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.137.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.137.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.138.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.138.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.139.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.139.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.140.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.140.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.141.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.141.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.141.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.141.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.142.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.142.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.143.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.143.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.144.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.144.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.144.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.144.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.145.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.145.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.146.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.146.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.147.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.147.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", 
"model.layers.44.mlp.experts.148.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.148.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.148.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.148.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.149.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.149.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.150.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.150.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.151.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.up_proj.weight": "model-00115-of-000163.safetensors", - 
"model.layers.44.mlp.experts.151.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.151.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.151.down_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.gate_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.gate_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.up_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.up_proj.weight_scale_inv": "model-00115-of-000163.safetensors", "model.layers.44.mlp.experts.152.down_proj.weight": "model-00115-of-000163.safetensors", - "model.layers.44.mlp.experts.152.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.153.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.153.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.154.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.154.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.155.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.155.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.155.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.155.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.156.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.156.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.157.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.157.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.158.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.158.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.158.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.158.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.159.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.159.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.160.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.160.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.161.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.161.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.162.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.162.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.162.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.162.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.163.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.163.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.164.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.164.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.165.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.165.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.165.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.165.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.166.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.166.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.167.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.167.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.168.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.168.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.169.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.169.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.169.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.169.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.170.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.170.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.171.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.171.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.172.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.172.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.172.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.172.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.173.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.173.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.174.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.174.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.175.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.175.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.176.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.176.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.176.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.176.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.177.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.177.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.178.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.178.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.179.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.179.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.179.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.179.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.180.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.180.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.181.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.181.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.182.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.182.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.183.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.183.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.183.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.183.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.184.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.184.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.185.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.185.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.186.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.186.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.186.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.186.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.187.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.187.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.188.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.188.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.189.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.189.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.190.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.190.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.190.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.190.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.191.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.191.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.192.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.192.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.193.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.193.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.193.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.193.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.194.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.194.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.195.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.195.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.196.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.196.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.197.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.197.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.197.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.197.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.198.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.198.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.199.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.199.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.200.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.200.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.200.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.200.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.201.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.201.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.202.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.202.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.203.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.203.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.204.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.204.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.204.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.204.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.205.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.205.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.206.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.206.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.207.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.207.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.207.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.207.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.208.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.208.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.209.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.209.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.210.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.210.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.211.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.211.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.211.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.211.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.212.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.212.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.213.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.213.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.214.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.214.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.214.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.214.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.215.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.215.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.216.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.216.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.217.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.217.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.218.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.218.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.218.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.218.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.219.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.219.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.220.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.220.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.221.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.221.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.221.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.221.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.222.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.222.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.223.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.223.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.224.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.224.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.225.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.225.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.225.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.225.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.226.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.226.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.227.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.227.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.228.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.228.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.228.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.228.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.229.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.229.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.230.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.230.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.231.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.231.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.232.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.232.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.232.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.232.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.233.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.233.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.234.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.234.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.235.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.235.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.235.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.235.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.236.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.236.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.237.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.237.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.238.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.238.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.239.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.239.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.239.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.239.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.240.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.240.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.241.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.241.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.242.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.242.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.242.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.242.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.243.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.243.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.244.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.244.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.245.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.245.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", 
"model.layers.44.mlp.experts.246.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.246.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.246.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.246.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.247.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.247.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.248.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.248.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.249.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.up_proj.weight": "model-00116-of-000163.safetensors", - 
"model.layers.44.mlp.experts.249.up_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.249.down_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.249.down_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.250.gate_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.250.gate_proj.weight_scale_inv": "model-00116-of-000163.safetensors", "model.layers.44.mlp.experts.250.up_proj.weight": "model-00116-of-000163.safetensors", - "model.layers.44.mlp.experts.250.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.250.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.250.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.251.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.251.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.252.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.252.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.44.mlp.experts.253.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.253.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.253.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.253.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.254.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.254.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.mlp.experts.255.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.44.mlp.experts.255.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.44.input_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.44.post_attention_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_a_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.self_attn.q_a_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_a_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.q_b_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.q_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_a_proj_with_mqa.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_a_layernorm.weight": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.kv_b_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.kv_b_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.self_attn.o_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.self_attn.o_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.gate.weight": "model-00117-of-000163.safetensors", "model.layers.45.mlp.gate.e_score_correction_bias": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.shared_experts.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.shared_experts.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.up_proj.weight": 
"model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.0.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.0.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.1.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.1.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.2.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.2.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.3.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.3.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.4.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.4.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.4.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.4.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.5.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.5.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.6.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.6.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.up_proj.weight_scale_inv": 
"model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.7.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.7.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.8.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.8.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.9.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.9.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.10.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.10.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.11.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.11.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.11.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.11.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.12.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.12.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.13.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.13.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.14.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.14.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.14.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.14.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.15.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.15.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.16.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.16.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.17.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.17.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.18.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.18.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.18.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.18.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.19.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.19.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.20.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.20.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.21.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.21.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.21.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.21.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.22.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.22.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.23.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.23.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.24.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.24.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.25.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.25.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.25.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.25.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.26.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.26.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.27.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.27.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.28.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.28.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.28.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.28.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.29.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.29.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.30.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.30.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.31.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.31.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.32.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.32.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.32.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.32.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.33.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.33.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.34.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.34.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.35.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.35.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.35.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.35.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.36.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.36.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.37.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.37.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.38.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.38.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.39.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.39.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.39.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.39.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.40.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.40.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.41.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.41.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.42.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.42.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.42.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.42.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.43.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.43.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.44.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.44.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.45.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.45.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.46.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.46.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.46.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.46.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.47.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.47.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.48.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.48.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.49.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.49.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.49.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.49.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.50.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.50.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.51.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.51.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.52.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.52.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.53.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.53.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.53.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.53.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.54.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.54.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.55.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.55.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.56.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.56.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.56.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.56.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.57.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.57.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.58.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.58.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.59.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.59.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.60.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.60.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.60.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.60.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.61.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.61.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.62.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.62.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.63.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.63.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.63.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.63.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.64.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.64.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.65.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.65.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.66.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.66.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.67.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.67.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.67.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.67.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.68.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.68.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.69.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.69.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.70.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.70.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.70.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.70.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.71.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.71.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.72.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.72.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.73.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.73.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.74.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.74.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.74.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.74.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.75.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.75.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.76.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.76.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.77.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.77.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.77.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.77.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.78.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.78.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.79.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.79.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.80.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.80.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.gate_proj.weight": "model-00117-of-000163.safetensors", - 
"model.layers.45.mlp.experts.81.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.81.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.81.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.81.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.82.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.82.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.83.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.83.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.84.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.84.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", 
"model.layers.45.mlp.experts.84.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.84.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.85.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.85.down_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.gate_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.gate_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.up_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.up_proj.weight_scale_inv": "model-00117-of-000163.safetensors", "model.layers.45.mlp.experts.86.down_proj.weight": "model-00117-of-000163.safetensors", - "model.layers.45.mlp.experts.86.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.87.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.87.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.88.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.88.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.88.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.88.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.89.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.89.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.90.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.90.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.91.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.91.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.91.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.91.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.92.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.92.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.93.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.93.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.94.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.94.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.95.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.95.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.95.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.95.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.96.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.96.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.97.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.97.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.98.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.98.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.98.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.98.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.99.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.99.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.100.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.100.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.101.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.101.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.102.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.102.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.102.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.102.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.103.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.103.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.104.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.104.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.105.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.105.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.105.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.105.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.106.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.106.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.107.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.107.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.108.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.108.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.109.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.109.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.109.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.109.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.110.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.110.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.111.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.111.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.112.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.112.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.112.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.112.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.113.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.113.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.114.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.114.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.115.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.115.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.116.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.116.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.116.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.116.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.117.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.117.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.118.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.118.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.119.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.119.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.119.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.119.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.120.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.120.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.121.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.121.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.122.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.122.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.123.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.123.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.123.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.123.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.124.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.124.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.125.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.125.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.126.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.126.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.126.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.126.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.127.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.127.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.128.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.128.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.129.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.129.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.130.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.130.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.130.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.130.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.131.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.131.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.132.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.132.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.133.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.133.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.133.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.133.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.134.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.134.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.135.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.135.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.136.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.136.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.137.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.137.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.137.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.137.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.138.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.138.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.139.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.139.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.140.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.140.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.140.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.140.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.141.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.141.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.142.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.142.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.143.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.143.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.144.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.144.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.144.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.144.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.145.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.145.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.146.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.146.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.147.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.147.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.147.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.147.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.148.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.148.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.149.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.149.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.150.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.150.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.151.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.151.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.151.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.151.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.152.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.152.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.153.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.153.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.154.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.154.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.154.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.154.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.155.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.155.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.156.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.156.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.157.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.157.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.158.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.158.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.158.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.158.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.159.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.159.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.160.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.160.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.161.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.161.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.161.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.161.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.162.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.162.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.163.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.163.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.164.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.164.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.165.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.165.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.165.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.165.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.166.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.166.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.167.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.167.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.168.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.168.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.168.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.168.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.169.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.169.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.170.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.170.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.171.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.171.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.172.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.172.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.172.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.172.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.173.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.173.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.174.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.174.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.175.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.175.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.175.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.175.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.176.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.176.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.177.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.177.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.178.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.178.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.gate_proj.weight": "model-00118-of-000163.safetensors", - 
"model.layers.45.mlp.experts.179.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.179.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.179.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.179.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.180.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.180.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.181.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.181.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.182.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.182.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", 
"model.layers.45.mlp.experts.182.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.182.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.up_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.183.down_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.183.down_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.184.gate_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.184.gate_proj.weight_scale_inv": "model-00118-of-000163.safetensors", "model.layers.45.mlp.experts.184.up_proj.weight": "model-00118-of-000163.safetensors", - "model.layers.45.mlp.experts.184.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.184.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.184.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.185.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.185.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.186.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.186.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.186.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.186.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.187.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.187.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.188.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.188.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.189.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.189.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.189.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.189.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.190.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.190.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.191.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.191.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.192.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.192.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.193.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.193.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.193.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.193.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.194.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.194.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.195.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.195.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.196.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.196.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.196.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.196.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.197.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.197.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.198.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.198.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.199.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.199.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.200.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.200.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.200.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.200.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.201.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.201.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.202.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.202.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.203.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.203.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.203.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.203.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.204.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.204.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.205.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.205.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.206.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.206.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.207.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.207.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.207.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.207.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.208.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.208.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.209.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.209.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.210.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.210.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.210.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.210.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.211.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.211.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.212.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.212.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.213.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.213.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.214.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.214.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.214.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.214.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.215.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.215.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.216.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.216.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.217.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.217.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.217.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.217.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.218.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.218.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.219.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.219.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.220.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.220.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.221.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.221.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.221.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.221.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.222.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.222.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.223.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.223.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.224.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.224.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.224.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.224.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.225.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.225.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.226.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.226.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.227.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.227.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.228.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.228.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.228.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.228.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.229.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.229.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.230.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.230.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.231.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.231.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.231.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.231.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.232.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.232.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.233.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.233.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.234.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.234.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.235.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.235.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.235.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.235.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.236.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.236.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.237.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.237.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.238.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.238.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.238.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.238.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.239.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.239.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.240.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.240.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.241.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.241.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.242.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.242.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.242.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.242.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.243.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.243.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.244.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.244.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.245.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.245.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.245.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.245.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.246.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.246.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.247.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.247.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.248.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.248.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.45.mlp.experts.249.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.249.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.249.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.249.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.250.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.250.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.251.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.251.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.252.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.252.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.45.mlp.experts.252.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.252.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.253.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.253.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.254.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.254.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.mlp.experts.255.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.45.mlp.experts.255.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.45.input_layernorm.weight": "model-00119-of-000163.safetensors", 
"model.layers.45.post_attention_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_a_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.q_a_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_a_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.q_b_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.q_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_a_proj_with_mqa.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_a_layernorm.weight": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.kv_b_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.kv_b_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.self_attn.o_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.self_attn.o_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.gate.weight": "model-00119-of-000163.safetensors", "model.layers.46.mlp.gate.e_score_correction_bias": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.shared_experts.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.shared_experts.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.gate_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.46.mlp.experts.0.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.0.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.0.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.0.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.1.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.1.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.2.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.2.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.3.down_proj.weight": 
"model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.3.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.4.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.4.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.5.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.5.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.6.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.6.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.7.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.46.mlp.experts.7.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.7.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.7.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.8.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.8.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.9.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.9.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.10.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.11.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.11.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.12.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.12.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.13.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.13.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.14.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.up_proj.weight": "model-00119-of-000163.safetensors", - 
"model.layers.46.mlp.experts.14.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.14.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.14.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.15.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.15.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.16.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.16.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.17.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.17.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", 
"model.layers.46.mlp.experts.18.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.18.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.18.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.18.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.19.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.19.down_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.gate_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.gate_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.up_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.up_proj.weight_scale_inv": "model-00119-of-000163.safetensors", "model.layers.46.mlp.experts.20.down_proj.weight": "model-00119-of-000163.safetensors", - "model.layers.46.mlp.experts.20.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.21.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.21.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.21.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.21.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.22.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.22.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.23.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.23.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.24.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.24.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.25.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.25.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.25.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.25.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.26.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.26.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.27.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.27.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.28.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.28.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.28.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.28.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.29.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.29.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.30.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.30.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.31.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.31.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.32.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.32.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.32.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.32.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.33.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.33.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.34.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.34.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.35.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.35.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.35.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.35.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.36.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.36.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.37.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.37.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.38.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.38.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.39.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.39.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.39.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.39.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.40.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.40.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.41.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.41.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.42.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.42.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.42.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.42.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.43.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.43.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.44.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.44.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.45.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.45.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.46.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.46.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.46.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.46.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.47.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.47.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.48.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.48.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.49.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.49.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.49.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.49.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.50.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.50.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.51.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.51.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.52.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.52.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.53.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.53.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.53.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.53.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.54.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.54.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.55.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.55.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.56.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.56.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.56.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.56.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.57.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.57.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.58.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.58.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.59.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.59.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.60.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.60.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.60.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.60.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.61.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.61.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.62.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.62.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.63.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.63.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.63.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.63.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.64.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.64.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.65.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.65.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.66.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.66.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.67.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.67.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.67.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.67.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.68.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.68.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.69.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.69.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.70.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.70.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.70.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.70.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.71.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.71.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.72.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.72.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.73.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.73.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.74.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.74.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.74.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.74.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.75.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.75.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.76.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.76.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.77.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.77.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.77.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.77.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.78.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.78.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.79.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.79.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.80.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.80.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.81.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.81.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.81.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.81.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.82.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.82.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.83.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.83.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.84.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.84.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.84.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.84.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.85.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.85.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.86.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.86.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.87.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.87.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.88.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.88.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.88.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.88.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.89.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.89.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.90.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.90.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.91.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.91.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.91.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.91.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.92.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.92.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.93.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.93.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.94.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.94.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.95.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.95.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.95.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.95.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.96.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.96.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.97.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.97.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.98.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.98.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.98.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.98.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.99.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.99.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.100.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.100.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.101.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.101.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.102.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.102.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.102.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.102.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.103.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.103.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.104.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.104.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.105.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.105.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.105.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.105.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.106.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.106.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.107.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.107.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.108.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.108.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.109.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.109.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.109.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.109.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.110.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.110.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.111.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.111.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.112.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.up_proj.weight": "model-00120-of-000163.safetensors", - 
"model.layers.46.mlp.experts.112.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.112.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.112.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.113.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.113.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.114.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.114.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.115.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.115.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", 
"model.layers.46.mlp.experts.116.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.116.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.116.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.116.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.up_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.117.down_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.117.down_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.118.gate_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.118.gate_proj.weight_scale_inv": "model-00120-of-000163.safetensors", "model.layers.46.mlp.experts.118.up_proj.weight": "model-00120-of-000163.safetensors", - "model.layers.46.mlp.experts.118.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.118.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.118.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.119.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.119.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.119.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.119.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.120.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.120.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.121.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.121.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.122.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.122.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.123.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.123.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.123.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.123.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.124.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.124.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.125.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.125.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.126.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.126.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.126.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.126.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.127.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.127.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.128.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.128.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.129.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.129.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.130.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.130.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.130.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.130.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.131.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.131.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.132.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.132.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.133.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.133.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.133.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.133.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.134.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.134.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.135.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.135.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.136.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.136.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.137.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.137.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.137.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.137.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.138.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.138.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.139.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.139.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.140.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.140.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.140.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.140.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.141.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.141.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.142.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.142.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.143.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.143.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.144.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.144.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.144.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.144.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.145.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.145.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.146.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.146.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.147.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.147.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.147.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.147.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.148.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.148.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.149.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.149.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.150.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.150.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.151.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.151.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.151.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.151.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.152.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.152.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.153.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.153.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.154.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.154.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.154.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.154.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.155.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.155.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.156.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.156.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.157.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.157.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.158.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.158.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.158.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.158.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.159.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.159.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.160.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.160.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.161.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.161.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.161.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.161.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.162.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.162.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.163.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.163.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.164.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.164.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.165.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.165.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.165.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.165.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.166.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.166.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.167.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.167.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.168.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.168.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.168.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.168.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.169.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.169.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.170.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.170.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.171.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.171.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.172.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.172.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.172.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.172.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.173.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.173.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.174.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.174.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.175.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.175.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.175.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.175.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.176.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.176.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.177.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.177.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.178.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.178.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.179.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.179.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.179.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.179.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.180.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.180.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.181.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.181.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.182.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.182.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.182.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.182.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.183.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.183.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.184.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.184.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.185.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.185.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.186.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.186.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.186.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.186.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.187.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.187.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.188.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.188.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.189.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.189.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.189.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.189.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.190.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.190.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.191.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.191.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.192.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.192.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.193.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.193.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.193.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.193.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.194.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.194.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.195.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.195.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.196.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.196.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.196.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.196.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.197.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.197.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.198.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.198.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.199.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.199.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.200.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.200.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.200.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.200.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.201.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.201.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.202.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.202.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.203.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.203.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.203.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.203.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.204.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.204.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.205.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.205.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.206.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.206.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.207.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.207.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.207.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.207.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.208.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.208.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.209.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.209.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.210.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.up_proj.weight": "model-00121-of-000163.safetensors", - 
"model.layers.46.mlp.experts.210.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.210.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.210.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.211.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.211.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.212.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.212.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.213.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.213.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", 
"model.layers.46.mlp.experts.214.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.214.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.214.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.214.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.gate_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.up_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.up_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.215.down_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.215.down_proj.weight_scale_inv": "model-00121-of-000163.safetensors", "model.layers.46.mlp.experts.216.gate_proj.weight": "model-00121-of-000163.safetensors", - "model.layers.46.mlp.experts.216.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.216.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.216.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.216.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.216.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.217.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.217.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.217.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.217.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.218.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.218.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.219.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.219.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.220.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.220.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.mlp.experts.221.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.221.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.221.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.221.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.222.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.222.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.223.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.223.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.224.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.224.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.224.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.224.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.225.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.225.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.226.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.226.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.227.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.227.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.mlp.experts.228.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.228.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.228.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.228.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.229.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.229.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.230.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.230.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.231.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.231.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.231.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.231.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.232.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.232.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.233.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.233.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.234.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.234.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.mlp.experts.235.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.235.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.235.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.235.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.236.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.236.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.237.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.237.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.238.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.238.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.238.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.238.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.239.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.239.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.240.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.240.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.241.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.241.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.mlp.experts.242.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.242.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.242.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.242.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.243.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.243.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.244.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.244.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.245.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.245.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.245.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.245.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.246.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.246.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.247.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.247.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.248.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.248.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.mlp.experts.249.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.249.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.249.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.249.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.250.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.250.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.251.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.251.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.252.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.up_proj.weight": "model-00122-of-000163.safetensors", - 
"model.layers.46.mlp.experts.252.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.252.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.252.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.253.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.253.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.254.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.254.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.gate_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.gate_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.up_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.up_proj.weight_scale_inv": "model-00122-of-000163.safetensors", "model.layers.46.mlp.experts.255.down_proj.weight": "model-00122-of-000163.safetensors", - "model.layers.46.mlp.experts.255.down_proj.weight_scale_inv": "model-00122-of-000163.safetensors", 
"model.layers.46.input_layernorm.weight": "model-00122-of-000163.safetensors", "model.layers.46.post_attention_layernorm.weight": "model-00122-of-000163.safetensors", "model.layers.47.self_attn.q_a_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.q_a_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.q_a_layernorm.weight": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.q_b_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.q_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_a_proj_with_mqa.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_a_layernorm.weight": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.kv_b_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.kv_b_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.self_attn.o_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.self_attn.o_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.gate.weight": "model-00123-of-000163.safetensors", "model.layers.47.mlp.gate.e_score_correction_bias": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.shared_experts.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.shared_experts.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.0.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.0.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.0.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.0.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.1.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.1.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.2.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.2.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.3.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.3.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.4.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.4.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.5.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.5.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.6.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.6.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.gate_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.7.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.7.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.7.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.7.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.8.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.8.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.9.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.9.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.10.down_proj.weight": 
"model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.10.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.11.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.11.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.12.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.12.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.13.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.13.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.14.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.14.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.15.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.15.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.16.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.16.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.17.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.17.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.17.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.17.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.18.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.18.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.19.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.19.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.20.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.20.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.21.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.21.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.21.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.21.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.22.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.22.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.23.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.23.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.24.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.24.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.24.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.24.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.25.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.25.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.26.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.26.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.27.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.27.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.28.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.28.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.28.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.28.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.29.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.29.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.30.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.30.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.31.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.31.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.31.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.31.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.32.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.32.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.33.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.33.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.34.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.34.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.35.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.35.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.35.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.35.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.36.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.36.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.37.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.37.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.38.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.38.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.38.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.38.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.39.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.39.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.40.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.40.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.41.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.41.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.42.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.42.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.42.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.42.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.43.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.43.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.44.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.44.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.45.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.45.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.45.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.45.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.46.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.46.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.47.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.47.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.48.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.48.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.49.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.49.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.49.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.49.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.50.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.50.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.51.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.51.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.52.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.52.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.52.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.52.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.53.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.53.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.54.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.54.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.55.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.55.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.56.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.56.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.56.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.56.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.57.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.57.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.58.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.58.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.59.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.59.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.59.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.59.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.60.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.60.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.61.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.61.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.62.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.62.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.63.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.63.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.63.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.63.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.64.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.64.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.65.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.65.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.66.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.66.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.66.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.66.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.67.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.67.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.68.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.68.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.69.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.69.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.70.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.70.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.70.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.70.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.71.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.71.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.72.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.72.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.73.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.73.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.73.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.73.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.74.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.74.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.75.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.75.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.76.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.76.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.77.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.77.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.77.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.77.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.78.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.78.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.79.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.79.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.80.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.80.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.80.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.80.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.81.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.81.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.82.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.82.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.83.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.83.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.84.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.84.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.84.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.84.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.85.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.85.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.86.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.86.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.87.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.87.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.87.down_proj.weight": "model-00123-of-000163.safetensors", - 
"model.layers.47.mlp.experts.87.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.88.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.88.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.89.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.89.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.90.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.90.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.91.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.gate_proj.weight_scale_inv": "model-00123-of-000163.safetensors", 
"model.layers.47.mlp.experts.91.up_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.up_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.91.down_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.91.down_proj.weight_scale_inv": "model-00123-of-000163.safetensors", "model.layers.47.mlp.experts.92.gate_proj.weight": "model-00123-of-000163.safetensors", - "model.layers.47.mlp.experts.92.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.92.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.92.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.92.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.92.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.93.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.93.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.94.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.94.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.94.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.94.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.95.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.95.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.96.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.96.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.97.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.97.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.98.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.98.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.98.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.98.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.99.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.99.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.100.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.100.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.101.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.101.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.101.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.101.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.102.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.102.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.103.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.103.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.104.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.104.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.105.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.105.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.105.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.105.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.106.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.106.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.107.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.107.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.108.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.108.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.108.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.108.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.109.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.109.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.110.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.110.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.111.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.111.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.112.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.112.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.112.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.112.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.113.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.113.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.114.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.114.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.115.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.115.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.115.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.115.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.116.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.116.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.117.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.117.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.118.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.118.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.119.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.119.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.119.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.119.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.120.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.120.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.121.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.121.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.122.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.122.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.122.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.122.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.123.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.123.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.124.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.124.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.125.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.125.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.126.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.126.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.126.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.126.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.127.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.127.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.128.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.128.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.129.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.129.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.129.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.129.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.130.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.130.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.131.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.131.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.132.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.132.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.133.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.133.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.133.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.133.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.134.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.134.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.135.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.135.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.136.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.136.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.136.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.136.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.137.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.137.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.138.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.138.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.139.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.139.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.140.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.140.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.140.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.140.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.141.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.141.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.142.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.142.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.143.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.143.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.143.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.143.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.144.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.144.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.145.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.145.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.146.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.146.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.147.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.147.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.147.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.147.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.148.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.148.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.149.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.149.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.150.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.150.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.150.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.150.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.151.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.151.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.152.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.152.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.153.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.153.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.154.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.154.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.154.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.154.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.155.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.155.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.156.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.156.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.157.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.157.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.157.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.157.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.158.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.158.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.159.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.159.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.160.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.160.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.161.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.161.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.161.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.161.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.162.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.162.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.163.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.163.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.164.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.164.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.164.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.164.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.165.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.165.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.166.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.166.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.167.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.167.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.168.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.168.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.168.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.168.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.169.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.169.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.170.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.170.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.171.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.171.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.171.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.171.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.172.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.172.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.173.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.173.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.174.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.174.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.175.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.175.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.175.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.175.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.176.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.176.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.177.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.177.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.178.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.178.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.178.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.178.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.179.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.179.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.180.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.180.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.181.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.181.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.182.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.182.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.182.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.182.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.183.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.183.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.184.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.184.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.185.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.185.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.185.down_proj.weight": "model-00124-of-000163.safetensors", - 
"model.layers.47.mlp.experts.185.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.186.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.186.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.187.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.187.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.188.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.188.down_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.189.gate_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.gate_proj.weight_scale_inv": "model-00124-of-000163.safetensors", 
"model.layers.47.mlp.experts.189.up_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.up_proj.weight_scale_inv": "model-00124-of-000163.safetensors", "model.layers.47.mlp.experts.189.down_proj.weight": "model-00124-of-000163.safetensors", - "model.layers.47.mlp.experts.189.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.190.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.190.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.191.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.191.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.192.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.192.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.192.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.192.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.193.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.193.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.194.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.194.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.195.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.195.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.196.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.196.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.196.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.196.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.197.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.197.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.198.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.198.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.199.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.199.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.199.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.199.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.200.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.200.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.201.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.201.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.202.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.202.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.203.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.203.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.203.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.203.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.204.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.204.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.205.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.205.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.206.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.206.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.206.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.206.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.207.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.207.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.208.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.208.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.209.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.209.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.210.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.210.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.210.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.210.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.211.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.211.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.212.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.212.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.213.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.213.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.213.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.213.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.214.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.214.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.215.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.215.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.216.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.216.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.217.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.217.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.217.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.217.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.218.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.218.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.219.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.219.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.220.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.220.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.220.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.220.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.221.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.221.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.222.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.222.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.223.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.223.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.224.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.224.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.224.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.224.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.225.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.225.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.226.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.226.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.227.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.227.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.227.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.227.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.228.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.228.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.229.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.229.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.230.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.230.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.231.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.231.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.231.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.231.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.232.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.232.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.233.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.233.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.234.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.234.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.234.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.234.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.235.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.235.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.236.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.236.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.237.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.237.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.238.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.238.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.238.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.238.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.239.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.239.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.240.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.240.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.241.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.241.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.241.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.241.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.242.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.242.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.243.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.243.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.244.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.244.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.245.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.245.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.245.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.245.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.246.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.246.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.247.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.247.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.248.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.248.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.248.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.248.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.249.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.249.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.250.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.250.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.251.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.251.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.252.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.47.mlp.experts.252.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.252.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.252.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.253.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.253.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.254.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.254.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.255.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.47.mlp.experts.255.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.mlp.experts.255.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.47.mlp.experts.255.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.47.input_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.47.post_attention_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_a_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.q_a_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_a_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.q_b_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.q_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_a_proj_with_mqa.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_a_layernorm.weight": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.kv_b_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.kv_b_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.self_attn.o_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.self_attn.o_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.gate.weight": "model-00125-of-000163.safetensors", "model.layers.48.mlp.gate.e_score_correction_bias": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.shared_experts.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.shared_experts.down_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.48.mlp.shared_experts.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.0.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.0.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.1.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.1.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.2.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.2.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.up_proj.weight": 
"model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.3.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.3.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.4.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.4.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.5.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.5.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.6.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.6.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.48.mlp.experts.7.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.7.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.7.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.7.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.8.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.8.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.9.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.9.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.10.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.10.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.11.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.11.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.12.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.12.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.13.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.13.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.gate_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.48.mlp.experts.14.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.14.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.14.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.14.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.15.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.15.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.16.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.16.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.17.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.17.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.48.mlp.experts.17.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.17.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.18.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.18.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.19.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.19.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.20.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.20.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.gate_proj.weight": "model-00125-of-000163.safetensors", - 
"model.layers.48.mlp.experts.21.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.21.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.21.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.21.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.22.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.22.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.23.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.23.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.24.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.24.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", 
"model.layers.48.mlp.experts.24.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.24.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.gate_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.up_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.up_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.25.down_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.25.down_proj.weight_scale_inv": "model-00125-of-000163.safetensors", "model.layers.48.mlp.experts.26.gate_proj.weight": "model-00125-of-000163.safetensors", - "model.layers.48.mlp.experts.26.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.26.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.26.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.26.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.26.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.27.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.27.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.28.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.28.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.28.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.28.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.29.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.29.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.30.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.30.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.31.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.31.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.31.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.31.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.32.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.32.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.33.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.33.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.34.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.34.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.35.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.35.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.35.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.35.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.36.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.36.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.37.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.37.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.38.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.38.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.38.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.38.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.39.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.39.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.40.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.40.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.41.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.41.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.42.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.42.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.42.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.42.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.43.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.43.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.44.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.44.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.45.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.45.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.45.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.45.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.46.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.46.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.47.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.47.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.48.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.48.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.49.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.49.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.49.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.49.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.50.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.50.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.51.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.51.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.52.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.52.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.52.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.52.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.53.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.53.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.54.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.54.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.55.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.55.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.56.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.56.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.56.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.56.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.57.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.57.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.58.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.58.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.59.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.59.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.59.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.59.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.60.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.60.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.61.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.61.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.62.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.62.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.63.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.63.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.63.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.63.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.64.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.64.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.65.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.65.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.66.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.66.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.66.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.66.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.67.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.67.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.68.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.68.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.69.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.69.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.70.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.70.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.70.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.70.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.71.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.71.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.72.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.72.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.73.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.73.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.73.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.73.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.74.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.74.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.75.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.75.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.76.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.76.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.77.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.77.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.77.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.77.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.78.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.78.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.79.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.79.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.80.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.80.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.80.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.80.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.81.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.81.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.82.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.82.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.83.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.83.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.84.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.84.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.84.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.84.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.85.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.85.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.86.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.86.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.87.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.87.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.87.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.87.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.88.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.88.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.89.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.89.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.90.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.90.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.91.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.91.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.91.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.91.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.92.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.92.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.93.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.93.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.94.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.94.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.94.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.94.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.95.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.95.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.96.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.96.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.97.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.97.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.98.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.98.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.98.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.98.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.99.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.99.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.100.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.100.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.101.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.101.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.101.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.101.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.102.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.102.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.103.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.103.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.104.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.104.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.105.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.105.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.105.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.105.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.106.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.106.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.107.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.107.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.108.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.108.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.108.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.108.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.109.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.109.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.110.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.110.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.111.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.111.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.112.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.112.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.112.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.112.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.113.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.113.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.114.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.114.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.115.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.115.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.115.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.115.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.116.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.116.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.117.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.117.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.118.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.118.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.gate_proj.weight": "model-00126-of-000163.safetensors", - 
"model.layers.48.mlp.experts.119.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.119.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.119.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.119.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.120.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.120.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.121.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.121.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.122.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.122.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", 
"model.layers.48.mlp.experts.122.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.122.down_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.gate_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.gate_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.up_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.up_proj.weight_scale_inv": "model-00126-of-000163.safetensors", "model.layers.48.mlp.experts.123.down_proj.weight": "model-00126-of-000163.safetensors", - "model.layers.48.mlp.experts.123.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.124.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.124.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.125.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.125.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.126.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.126.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.126.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.126.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.127.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.127.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.128.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.128.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.129.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.129.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.129.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.129.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.130.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.130.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.131.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.131.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.132.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.132.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.133.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.133.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.133.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.133.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.134.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.134.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.135.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.135.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.136.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.136.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.136.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.136.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.137.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.137.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.138.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.138.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.139.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.139.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.140.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.140.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.140.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.140.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.141.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.141.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.142.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.142.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.143.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.143.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.143.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.143.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.144.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.144.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.145.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.145.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.146.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.146.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.147.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.147.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.147.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.147.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.148.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.148.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.149.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.149.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.150.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.150.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.150.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.150.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.151.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.151.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.152.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.152.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.153.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.153.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.154.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.154.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.154.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.154.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.155.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.155.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.156.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.156.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.157.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.157.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.157.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.157.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.158.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.158.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.159.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.159.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.160.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.160.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.161.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.161.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.161.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.161.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.162.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.162.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.163.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.163.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.164.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.164.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.164.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.164.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.165.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.165.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.166.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.166.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.167.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.167.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.168.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.168.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.168.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.168.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.169.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.169.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.170.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.170.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.171.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.171.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.171.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.171.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.172.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.172.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.173.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.173.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.174.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.174.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.175.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.175.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.175.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.175.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.176.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.176.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.177.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.177.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.178.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.178.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.178.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.178.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.179.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.179.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.180.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.180.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.181.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.181.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.182.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.182.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.182.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.182.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.183.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.183.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.184.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.184.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.185.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.185.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.185.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.185.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.186.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.186.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.187.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.187.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.188.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.188.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.189.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.189.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.189.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.189.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.190.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.190.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.191.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.191.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.192.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.192.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.192.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.192.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.193.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.193.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.194.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.194.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.195.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.195.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.196.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.196.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.196.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.196.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.197.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.197.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.198.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.198.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.199.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.199.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.199.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.199.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.200.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.200.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.201.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.201.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.202.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.202.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.203.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.203.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.203.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.203.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.204.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.204.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.205.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.205.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.206.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.206.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.206.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.206.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.207.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.207.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.208.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.208.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.209.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.209.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.210.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.210.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.210.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.210.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.211.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.211.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.212.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.212.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.213.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.213.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.213.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.213.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.214.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.214.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.215.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.215.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.216.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.216.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.gate_proj.weight": "model-00127-of-000163.safetensors", - 
"model.layers.48.mlp.experts.217.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.217.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.217.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.217.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.218.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.218.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.219.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.219.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.220.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.220.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.up_proj.weight_scale_inv": "model-00127-of-000163.safetensors", 
"model.layers.48.mlp.experts.220.down_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.220.down_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.221.gate_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.221.gate_proj.weight_scale_inv": "model-00127-of-000163.safetensors", "model.layers.48.mlp.experts.221.up_proj.weight": "model-00127-of-000163.safetensors", - "model.layers.48.mlp.experts.221.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.221.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.221.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.222.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.222.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.223.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.223.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.48.mlp.experts.224.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.224.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.224.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.224.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.225.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.225.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.226.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.226.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.227.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.227.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.48.mlp.experts.227.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.227.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.228.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.228.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.229.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.229.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.230.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.230.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.48.mlp.experts.231.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.231.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.231.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.231.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.232.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.232.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.233.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.233.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.234.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.234.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.48.mlp.experts.234.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.234.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.235.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.235.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.236.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.236.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.237.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.237.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.48.mlp.experts.238.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.238.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.238.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.238.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.239.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.239.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.240.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.240.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.241.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.241.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.48.mlp.experts.241.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.241.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.242.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.242.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.243.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.243.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.244.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.244.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.48.mlp.experts.245.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.245.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.245.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.245.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.246.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.246.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.247.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.247.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.248.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.248.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.48.mlp.experts.248.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.248.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.249.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.249.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.250.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.250.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.251.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.251.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.48.mlp.experts.252.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.252.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.252.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.252.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.253.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.253.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.254.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.254.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.255.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.mlp.experts.255.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.48.mlp.experts.255.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.48.mlp.experts.255.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.48.input_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.48.post_attention_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_a_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.q_a_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_a_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.q_b_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.q_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_a_proj_with_mqa.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_a_layernorm.weight": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.kv_b_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.kv_b_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.self_attn.o_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.self_attn.o_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.gate.weight": "model-00128-of-000163.safetensors", "model.layers.49.mlp.gate.e_score_correction_bias": "model-00128-of-000163.safetensors", "model.layers.49.mlp.shared_experts.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.shared_experts.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.shared_experts.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.shared_experts.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.0.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.0.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.1.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.1.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.2.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.2.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.gate_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.3.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.3.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.3.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.3.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.4.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.4.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.5.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.5.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.6.down_proj.weight": 
"model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.6.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.7.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.7.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.8.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.8.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.9.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.9.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.10.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.10.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.10.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.10.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.11.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.11.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.12.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.12.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.13.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.13.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.13.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.13.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.14.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.14.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.15.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.15.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.16.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.16.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.17.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.17.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.17.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.17.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.18.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.18.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.19.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.19.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.20.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.20.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.20.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.20.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.21.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.21.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.22.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.22.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.23.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.23.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.24.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.24.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.24.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.24.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.25.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.25.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.26.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.26.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.27.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.27.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.27.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.27.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.28.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.28.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.29.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.29.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.30.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.30.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.31.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.31.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.31.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.31.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.32.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.32.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.33.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.33.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.34.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.34.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.34.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.34.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.35.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.35.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.36.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.36.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.37.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.37.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.38.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.38.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.38.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.38.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.39.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.39.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.40.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.40.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.41.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.41.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.41.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.41.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.42.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.42.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.43.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.43.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.44.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.44.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.45.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.45.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.45.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.45.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.46.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.46.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.47.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.47.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.48.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.48.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.48.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.48.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.49.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.49.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.50.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.50.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.51.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.51.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.52.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", 
"model.layers.49.mlp.experts.52.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.52.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.52.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.53.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.53.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.54.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.54.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.55.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.55.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.55.down_proj.weight": "model-00128-of-000163.safetensors", - 
"model.layers.49.mlp.experts.55.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.56.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.56.down_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.gate_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.gate_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.up_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.up_proj.weight_scale_inv": "model-00128-of-000163.safetensors", "model.layers.49.mlp.experts.57.down_proj.weight": "model-00128-of-000163.safetensors", - "model.layers.49.mlp.experts.57.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.58.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.58.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.59.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.59.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.59.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.59.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.60.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.60.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.61.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.61.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.62.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.62.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.62.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.62.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.63.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.63.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.64.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.64.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.65.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.65.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.66.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.66.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.66.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.66.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.67.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.67.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.68.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.68.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.69.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.69.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.69.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.69.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.70.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.70.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.71.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.71.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.72.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.72.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.73.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.73.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.73.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.73.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.74.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.74.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.75.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.75.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.76.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.76.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.76.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.76.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.77.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.77.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.78.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.78.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.79.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.79.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.80.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.80.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.80.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.80.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.81.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.81.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.82.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.82.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.83.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.83.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.83.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.83.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.84.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.84.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.85.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.85.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.86.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.86.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.87.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.87.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.87.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.87.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.88.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.88.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.89.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.89.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.90.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.90.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.90.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.90.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.91.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.91.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.92.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.92.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.93.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.93.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.94.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.94.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.94.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.94.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.95.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.95.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.96.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.96.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.97.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.97.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.97.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.97.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.98.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.98.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.99.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.99.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.100.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.100.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.101.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.101.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.101.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.101.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.102.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.102.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.103.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.103.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.104.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.104.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.104.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.104.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.105.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.105.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.106.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.106.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.107.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.107.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.108.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.108.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.108.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.108.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.109.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.109.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.110.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.110.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.111.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.111.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.111.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.111.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.112.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.112.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.113.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.113.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.114.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.114.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.115.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.115.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.115.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.115.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.116.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.116.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.117.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.117.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.118.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.118.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.118.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.118.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.119.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.119.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.120.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.120.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.121.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.121.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.122.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.122.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.122.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.122.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.123.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.123.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.124.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.124.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.125.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.125.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.125.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.125.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.126.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.126.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.127.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.127.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.128.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.128.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.129.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.129.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.129.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.129.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.130.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.130.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.131.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.131.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.132.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.132.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.132.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.132.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.133.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.133.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.134.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.134.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.135.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.135.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.136.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.136.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.136.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.136.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.137.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.137.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.138.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.138.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.139.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.139.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.139.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.139.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.140.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.140.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.141.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.141.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.142.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.142.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.143.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.143.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.143.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.143.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.144.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.144.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.145.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.145.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.146.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.146.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.146.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.146.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.147.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.147.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.148.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.148.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.149.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.149.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.150.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", 
"model.layers.49.mlp.experts.150.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.150.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.150.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.151.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.151.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.152.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.152.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.153.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.153.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.153.down_proj.weight": "model-00129-of-000163.safetensors", - 
"model.layers.49.mlp.experts.153.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.up_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.154.down_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.154.down_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.155.gate_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.155.gate_proj.weight_scale_inv": "model-00129-of-000163.safetensors", "model.layers.49.mlp.experts.155.up_proj.weight": "model-00129-of-000163.safetensors", - "model.layers.49.mlp.experts.155.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.155.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.155.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.156.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.156.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.157.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.157.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.157.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.157.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.158.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.158.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.159.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.159.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.160.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.160.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.160.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.160.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.161.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.161.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.162.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.162.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.163.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.163.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.164.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.164.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.164.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.164.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.165.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.165.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.166.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.166.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.167.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.167.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.167.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.167.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.168.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.168.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.169.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.169.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.170.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.170.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.171.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.171.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.171.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.171.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.172.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.172.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.173.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.173.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.174.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.174.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.174.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.174.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.175.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.175.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.176.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.176.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.177.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.177.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.178.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.178.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.178.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.178.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.179.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.179.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.180.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.180.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.181.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.181.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.181.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.181.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.182.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.182.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.183.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.183.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.184.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.184.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.185.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.185.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.185.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.185.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.186.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.186.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.187.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.187.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.188.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.188.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.188.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.188.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.189.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.189.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.190.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.190.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.191.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.191.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.192.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.192.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.192.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.192.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.193.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.193.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.194.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.194.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.195.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.195.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.195.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.195.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.196.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.196.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.197.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.197.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.198.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.198.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.199.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.199.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.199.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.199.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.200.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.200.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.201.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.201.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.202.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.202.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.202.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.202.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.203.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.203.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.204.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.204.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.205.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.205.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.206.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.206.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.206.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.206.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.207.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.207.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.208.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.208.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.209.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.209.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.209.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.209.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.210.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.210.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.211.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.211.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.212.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.212.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.213.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.213.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.213.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.213.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.214.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.214.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.215.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.215.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.216.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.216.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.216.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.216.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.217.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.217.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.218.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.218.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.219.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.219.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.220.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.220.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.220.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.220.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.221.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.221.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.222.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.222.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.223.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.223.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.223.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.223.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.224.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.224.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.225.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.225.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.226.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.226.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.227.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.227.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.227.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.227.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.228.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.228.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.229.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.229.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.230.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.230.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.230.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.230.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.231.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.231.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.232.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.232.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.233.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.233.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.234.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.234.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.234.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.234.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.235.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.235.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.236.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.236.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.237.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.237.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.237.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.237.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.238.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.238.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.239.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.239.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.240.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.240.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.241.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.241.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.241.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.241.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.242.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.242.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.243.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.243.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.244.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.244.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.244.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.244.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.245.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.245.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.246.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.246.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.247.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.247.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.248.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", 
"model.layers.49.mlp.experts.248.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.248.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.248.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.249.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.249.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.250.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.250.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.251.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.251.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.251.down_proj.weight": "model-00130-of-000163.safetensors", - 
"model.layers.49.mlp.experts.251.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.gate_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.up_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.up_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.252.down_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.252.down_proj.weight_scale_inv": "model-00130-of-000163.safetensors", "model.layers.49.mlp.experts.253.gate_proj.weight": "model-00130-of-000163.safetensors", - "model.layers.49.mlp.experts.253.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.253.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.253.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.253.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.253.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.254.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.254.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.255.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.49.mlp.experts.255.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.mlp.experts.255.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.49.mlp.experts.255.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.49.input_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.49.post_attention_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_a_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.q_a_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_a_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.q_b_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.q_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_a_proj_with_mqa.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_a_layernorm.weight": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.kv_b_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.kv_b_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.self_attn.o_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.self_attn.o_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.gate.weight": "model-00131-of-000163.safetensors", "model.layers.50.mlp.gate.e_score_correction_bias": "model-00131-of-000163.safetensors", "model.layers.50.mlp.shared_experts.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.shared_experts.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.shared_experts.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.shared_experts.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.0.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.0.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.1.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.1.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.2.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.2.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.2.down_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.2.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.3.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.3.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.4.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.4.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.5.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.5.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.up_proj.weight": 
"model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.6.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.6.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.7.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.7.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.8.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.8.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.9.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.9.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.10.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.10.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.10.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.10.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.11.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.11.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.12.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.12.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.13.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.13.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.13.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.13.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.14.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.14.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.15.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.15.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.16.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.16.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.17.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.17.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.17.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.17.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.18.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.18.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.19.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.19.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.20.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.20.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.20.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.20.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.21.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.21.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.22.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.22.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.23.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.23.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.24.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.24.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.24.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.24.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.25.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.25.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.26.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.26.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.27.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.27.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.27.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.27.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.28.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.28.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.29.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.29.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.30.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.30.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.31.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.31.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.31.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.31.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.32.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.32.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.33.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.33.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.34.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.34.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.34.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.34.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.35.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.35.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.36.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.36.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.37.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.37.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.38.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.38.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.38.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.38.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.39.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.39.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.40.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.40.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.41.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.41.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.41.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.41.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.42.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.42.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.43.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.43.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.44.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.44.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.45.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.45.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.45.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.45.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.46.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.46.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.47.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.47.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.48.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.48.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.48.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.48.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.49.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.49.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.50.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.50.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.51.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.51.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.52.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.52.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.52.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.52.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.53.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.53.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.54.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.54.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.55.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.55.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.55.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.55.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.56.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.56.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.57.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.57.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.58.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.58.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.59.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.59.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.59.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.59.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.60.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.60.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.61.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.61.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.62.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.62.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.62.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.62.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.63.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.63.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.64.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.64.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.65.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.65.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.66.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.66.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.66.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.66.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.67.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.67.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.68.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.68.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.69.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.69.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.69.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.69.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.70.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.70.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.71.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.71.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.72.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.72.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.73.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.73.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.73.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.73.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.74.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.74.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.75.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.75.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.76.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.76.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.76.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.76.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.77.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.77.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.78.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.78.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.79.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.79.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.80.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.80.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.80.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.80.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.81.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.81.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.82.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.82.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.83.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.up_proj.weight": "model-00131-of-000163.safetensors", - 
"model.layers.50.mlp.experts.83.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.83.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.83.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.84.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.84.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.85.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.85.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.86.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.86.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", 
"model.layers.50.mlp.experts.87.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.87.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.87.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.87.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.up_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.88.down_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.88.down_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.89.gate_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.89.gate_proj.weight_scale_inv": "model-00131-of-000163.safetensors", "model.layers.50.mlp.experts.89.up_proj.weight": "model-00131-of-000163.safetensors", - "model.layers.50.mlp.experts.89.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.89.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.89.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.90.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.90.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.90.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.90.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.91.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.91.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.92.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.92.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.93.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.93.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.94.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.94.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.94.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.94.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.95.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.95.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.96.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.96.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.97.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.97.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.97.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.97.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.98.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.98.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.99.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.99.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.100.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.100.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.101.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.101.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.101.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.101.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.102.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.102.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.103.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.103.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.104.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.104.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.104.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.104.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.105.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.105.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.106.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.106.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.107.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.107.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.108.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.108.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.108.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.108.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.109.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.109.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.110.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.110.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.111.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.111.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.111.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.111.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.112.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.112.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.113.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.113.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.114.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.114.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.115.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.115.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.115.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.115.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.116.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.116.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.117.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.117.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.118.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.118.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.118.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.118.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.119.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.119.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.120.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.120.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.121.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.121.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.122.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.122.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.122.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.122.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.123.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.123.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.124.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.124.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.125.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.125.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.125.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.125.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.126.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.126.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.127.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.127.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.128.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.128.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.129.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.129.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.129.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.129.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.130.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.130.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.131.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.131.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.132.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.132.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.132.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.132.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.133.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.133.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.134.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.134.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.135.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.135.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.136.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.136.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.136.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.136.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.137.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.137.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.138.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.138.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.139.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.139.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.139.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.139.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.140.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.140.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.141.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.141.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.142.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.142.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.143.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.143.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.143.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.143.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.144.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.144.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.145.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.145.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.146.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.146.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.146.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.146.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.147.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.147.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.148.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.148.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.149.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.149.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.150.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.150.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.150.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.150.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.151.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.151.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.152.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.152.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.153.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.153.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.153.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.153.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.154.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.154.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.155.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.155.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.156.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.156.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.157.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.157.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.157.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.157.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.158.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.158.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.159.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.159.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.160.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.160.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.160.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.160.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.161.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.161.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.162.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.162.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.163.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.163.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.164.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.164.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.164.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.164.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.165.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.165.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.166.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.166.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.167.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.167.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.167.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.167.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.168.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.168.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.169.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.169.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.170.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.170.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.171.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.171.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.171.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.171.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.172.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.172.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.173.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.173.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.174.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.174.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.174.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.174.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.175.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.175.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.176.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.176.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.177.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.177.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.178.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.178.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.178.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.178.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.179.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.179.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.180.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.180.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.181.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.up_proj.weight": "model-00132-of-000163.safetensors", - 
"model.layers.50.mlp.experts.181.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.181.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.181.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.182.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.182.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.183.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.183.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.184.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.184.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", 
"model.layers.50.mlp.experts.185.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.185.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.185.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.185.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.gate_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.up_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.up_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.186.down_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.186.down_proj.weight_scale_inv": "model-00132-of-000163.safetensors", "model.layers.50.mlp.experts.187.gate_proj.weight": "model-00132-of-000163.safetensors", - "model.layers.50.mlp.experts.187.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.187.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.187.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.187.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.187.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.188.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.188.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.188.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.188.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.189.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.189.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.190.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.190.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.191.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.191.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.192.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.192.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.192.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.192.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.193.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.193.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.194.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.194.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.195.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.195.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.195.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.195.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.196.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.196.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.197.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.197.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.198.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.198.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.199.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.199.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.199.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.199.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.200.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.200.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.201.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.201.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.202.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.202.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.202.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.202.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.203.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.203.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.204.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.204.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.205.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.205.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.206.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.206.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.206.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.206.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.207.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.207.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.208.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.208.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.209.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.209.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.209.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.209.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.210.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.210.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.211.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.211.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.212.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.212.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.213.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.213.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.213.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.213.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.214.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.214.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.215.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.215.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.216.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.216.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.216.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.216.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.217.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.217.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.218.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.218.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.219.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.219.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.220.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.220.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.220.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.220.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.221.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.221.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.222.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.222.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.223.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.223.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.223.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.223.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.224.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.224.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.225.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.225.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.226.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.226.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.227.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.227.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.227.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.227.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.228.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.228.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.229.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.229.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.230.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.230.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.230.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.230.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.231.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.231.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.232.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.232.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.233.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.233.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.234.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.234.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.234.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.234.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.235.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.235.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.236.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.236.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.237.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.237.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.237.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.237.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.238.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.238.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.239.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.239.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.240.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.240.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.241.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.241.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.241.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.241.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.242.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.242.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.243.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.243.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.244.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.244.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.244.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.244.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.245.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.245.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.246.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.246.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.247.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.247.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.248.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.248.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.248.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.248.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.249.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.249.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.250.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.250.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.251.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.50.mlp.experts.251.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.251.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.251.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.252.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.252.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.253.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.253.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.254.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.254.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.50.mlp.experts.255.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.255.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.mlp.experts.255.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.50.mlp.experts.255.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.50.input_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.50.post_attention_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_a_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.q_a_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_a_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.q_b_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.q_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_a_proj_with_mqa.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_a_layernorm.weight": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.kv_b_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.kv_b_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.self_attn.o_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.self_attn.o_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.gate.weight": "model-00133-of-000163.safetensors", "model.layers.51.mlp.gate.e_score_correction_bias": "model-00133-of-000163.safetensors", 
"model.layers.51.mlp.shared_experts.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.shared_experts.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.shared_experts.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.shared_experts.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.0.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.0.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.1.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.1.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.2.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.up_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.51.mlp.experts.2.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.2.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.2.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.3.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.3.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.4.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.4.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.5.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.5.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.gate_proj.weight": 
"model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.6.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.6.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.7.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.7.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.8.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.8.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.9.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.9.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.51.mlp.experts.9.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.9.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.10.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.10.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.11.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.11.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.12.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.12.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.gate_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.51.mlp.experts.13.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.13.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.13.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.13.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.14.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.14.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.15.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.15.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.16.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.16.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", 
"model.layers.51.mlp.experts.16.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.16.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.17.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.17.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.18.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.18.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.19.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.19.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.gate_proj.weight": "model-00133-of-000163.safetensors", - 
"model.layers.51.mlp.experts.20.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.20.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.20.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.20.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.21.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.21.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.up_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.22.down_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.22.down_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.23.gate_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.23.gate_proj.weight_scale_inv": "model-00133-of-000163.safetensors", "model.layers.51.mlp.experts.23.up_proj.weight": "model-00133-of-000163.safetensors", - "model.layers.51.mlp.experts.23.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.23.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.23.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.24.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.24.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.25.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.25.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.26.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.26.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.27.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.27.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.27.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.27.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.28.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.28.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.29.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.29.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.30.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.30.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.30.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.30.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.31.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.31.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.32.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.32.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.33.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.33.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.34.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.34.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.34.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.34.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.35.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.35.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.36.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.36.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.37.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.37.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.37.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.37.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.38.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.38.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.39.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.39.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.40.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.40.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.41.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.41.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.41.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.41.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.42.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.42.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.43.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.43.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.44.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.44.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.44.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.44.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.45.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.45.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.46.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.46.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.47.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.47.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.48.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.48.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.48.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.48.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.49.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.49.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.50.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.50.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.51.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.51.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.51.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.51.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.52.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.52.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.53.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.53.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.54.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.54.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.55.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.55.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.55.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.55.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.56.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.56.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.57.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.57.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.58.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.58.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.58.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.58.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.59.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.59.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.60.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.60.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.61.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.61.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.62.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.62.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.62.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.62.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.63.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.63.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.64.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.64.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.65.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.65.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.65.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.65.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.66.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.66.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.67.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.67.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.68.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.68.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.69.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.69.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.69.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.69.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.70.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.70.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.71.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.71.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.72.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.72.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.72.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.72.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.73.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.73.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.74.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.74.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.75.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.75.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.76.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.76.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.76.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.76.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.77.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.77.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.78.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.78.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.79.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.79.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.79.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.79.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.80.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.80.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.81.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.81.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.82.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.82.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.83.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.83.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.83.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.83.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.84.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.84.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.85.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.85.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.86.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.86.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.86.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.86.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.87.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.87.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.88.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.88.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.89.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.89.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.90.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.90.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.90.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.90.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.91.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.91.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.92.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.92.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.93.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.93.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.93.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.93.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.94.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.94.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.95.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.95.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.96.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.96.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.97.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.97.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.97.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.97.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.98.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.98.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.99.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.99.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.100.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.100.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.100.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.100.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.101.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.101.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.102.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.102.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.103.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.103.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.104.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.104.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.104.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.104.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.105.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.105.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.106.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.106.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.107.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.107.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.107.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.107.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.108.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.108.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.109.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.109.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.110.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.110.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.111.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.111.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.111.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.111.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.112.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.112.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.113.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.113.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.114.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.114.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", 
"model.layers.51.mlp.experts.114.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.114.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.115.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.115.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.116.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.116.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.117.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.117.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.gate_proj.weight": "model-00134-of-000163.safetensors", - 
"model.layers.51.mlp.experts.118.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.118.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.118.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.118.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.119.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.119.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.gate_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.up_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.up_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.120.down_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.120.down_proj.weight_scale_inv": "model-00134-of-000163.safetensors", "model.layers.51.mlp.experts.121.gate_proj.weight": "model-00134-of-000163.safetensors", - "model.layers.51.mlp.experts.121.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.121.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.121.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.121.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.121.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.122.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.122.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.123.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.123.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.124.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.124.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.125.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.125.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.125.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.125.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.126.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.126.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.127.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.127.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.128.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.128.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.128.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.128.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.129.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.129.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.130.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.130.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.131.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.131.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.132.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.132.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.132.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.132.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.133.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.133.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.134.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.134.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.135.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.135.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.135.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.135.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.136.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.136.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.137.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.137.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.138.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.138.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.139.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.139.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.139.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.139.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.140.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.140.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.141.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.141.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.142.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.142.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.142.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.142.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.143.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.143.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.144.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.144.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.145.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.145.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.146.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.146.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.146.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.146.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.147.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.147.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.148.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.148.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.149.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.149.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.149.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.149.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.150.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.150.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.151.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.151.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.152.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.152.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.153.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.153.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.153.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.153.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.154.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.154.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.155.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.155.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.156.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.156.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.156.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.156.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.157.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.157.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.158.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.158.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.159.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.159.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.160.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.160.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.160.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.160.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.161.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.161.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.162.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.162.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.163.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.163.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.163.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.163.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.164.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.164.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.165.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.165.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.166.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.166.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.167.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.167.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.167.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.167.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.168.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.168.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.169.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.169.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.170.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.170.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.170.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.170.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.171.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.171.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.172.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.172.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.173.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.173.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.174.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.174.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.174.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.174.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.175.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.175.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.176.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.176.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.177.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.177.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.177.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.177.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.178.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.178.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.179.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.179.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.180.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.180.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.181.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.181.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.181.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.181.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.182.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.182.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.183.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.183.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.184.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.184.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.184.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.184.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.185.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.185.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.186.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.186.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.187.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.187.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.188.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.188.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.188.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.188.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.189.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.189.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.190.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.190.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.191.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.191.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.191.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.191.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.192.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.192.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.193.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.193.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.194.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.194.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.195.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.195.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.195.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.195.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.196.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.196.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.197.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.197.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.198.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.198.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.198.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.198.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.199.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.199.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.200.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.200.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.201.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.201.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.202.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.202.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.202.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.202.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.203.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.203.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.204.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.204.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.205.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.205.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.205.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.205.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.206.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.206.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.207.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.207.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.208.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.208.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.209.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.209.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.209.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.209.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.210.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.210.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.211.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.211.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.212.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.212.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", 
"model.layers.51.mlp.experts.212.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.212.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.213.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.213.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.214.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.214.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.215.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.215.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.gate_proj.weight": "model-00135-of-000163.safetensors", - 
"model.layers.51.mlp.experts.216.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.216.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.216.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.216.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.217.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.217.down_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.gate_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.gate_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.up_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.up_proj.weight_scale_inv": "model-00135-of-000163.safetensors", "model.layers.51.mlp.experts.218.down_proj.weight": "model-00135-of-000163.safetensors", - "model.layers.51.mlp.experts.218.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.219.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.219.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.219.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.219.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.220.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.220.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.221.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.221.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.222.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.222.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.51.mlp.experts.223.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.223.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.223.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.223.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.224.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.224.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.225.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.225.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.226.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.226.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.226.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.226.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.227.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.227.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.228.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.228.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.229.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.229.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.51.mlp.experts.230.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.230.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.230.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.230.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.231.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.231.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.232.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.232.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.233.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.233.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.233.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.233.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.234.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.234.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.235.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.235.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.236.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.236.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.51.mlp.experts.237.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.237.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.237.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.237.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.238.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.238.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.239.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.239.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.240.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.240.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.240.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.240.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.241.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.241.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.242.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.242.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.243.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.243.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.51.mlp.experts.244.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.244.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.244.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.244.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.245.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.245.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.246.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.246.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.247.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.247.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.247.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.247.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.248.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.248.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.249.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.249.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.250.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.250.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.51.mlp.experts.251.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.251.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.251.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.251.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.252.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.252.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.253.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.253.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.254.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.254.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.51.mlp.experts.254.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.254.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.mlp.experts.255.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.51.mlp.experts.255.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.51.input_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.51.post_attention_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_a_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.q_a_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_a_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.q_b_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.q_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_a_proj_with_mqa.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_a_layernorm.weight": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.kv_b_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.kv_b_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.self_attn.o_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.self_attn.o_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.gate.weight": "model-00136-of-000163.safetensors", "model.layers.52.mlp.gate.e_score_correction_bias": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.shared_experts.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.shared_experts.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.0.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.0.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.1.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.1.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.gate_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.2.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.2.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.2.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.2.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.3.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.3.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.4.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.4.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.5.down_proj.weight": 
"model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.5.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.6.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.6.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.7.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.7.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.8.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.8.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.9.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.9.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.9.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.9.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.10.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.10.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.11.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.11.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.12.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.12.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.12.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.12.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.13.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.13.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.14.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.14.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.15.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.15.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.16.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.16.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.16.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.16.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.17.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.17.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.18.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.18.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.19.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.19.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.19.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.19.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.20.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.20.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.21.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.21.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.22.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.22.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.23.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.23.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.23.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.23.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.24.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.24.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.25.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.25.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.26.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.26.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.26.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.26.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.27.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.27.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.28.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.28.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.29.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.29.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.30.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.30.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.30.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.30.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.31.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.31.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.32.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.32.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.33.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.33.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.33.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.33.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.34.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.34.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.35.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.35.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.36.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.36.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.37.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.37.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.37.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.37.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.38.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.38.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.39.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.39.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.40.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.40.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.40.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.40.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.41.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.41.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.42.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.42.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.43.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.43.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.44.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.44.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.44.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.44.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.45.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.45.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.46.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.46.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.47.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.47.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.47.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.47.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.48.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.48.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.49.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.49.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.50.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.50.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.51.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", 
"model.layers.52.mlp.experts.51.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.51.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.51.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.52.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.52.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.53.down_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.53.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.54.gate_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.up_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.54.up_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.54.down_proj.weight": "model-00136-of-000163.safetensors", - 
"model.layers.52.mlp.experts.54.down_proj.weight_scale_inv": "model-00136-of-000163.safetensors", "model.layers.52.mlp.experts.55.gate_proj.weight": "model-00136-of-000163.safetensors", - "model.layers.52.mlp.experts.55.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.55.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.55.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.55.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.55.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.56.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.56.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.57.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.57.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.58.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.58.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.58.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.58.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.59.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.59.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.60.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.60.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.61.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.61.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.61.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.61.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.62.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.62.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.63.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.63.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.64.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.64.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.65.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.65.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.65.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.65.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.66.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.66.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.67.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.67.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.68.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.68.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.68.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.68.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.69.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.69.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.70.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.70.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.71.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.71.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.72.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.72.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.72.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.72.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.73.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.73.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.74.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.74.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.75.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.75.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.75.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.75.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.76.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.76.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.77.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.77.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.78.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.78.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.79.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.79.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.79.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.79.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.80.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.80.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.81.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.81.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.82.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.82.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.82.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.82.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.83.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.83.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.84.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.84.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.85.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.85.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.86.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.86.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.86.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.86.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.87.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.87.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.88.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.88.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.89.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.89.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.89.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.89.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.90.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.90.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.91.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.91.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.92.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.92.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.93.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.93.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.93.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.93.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.94.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.94.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.95.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.95.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.96.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.96.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.96.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.96.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.97.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.97.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.98.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.98.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.99.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.99.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.100.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.100.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.100.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.100.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.101.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.101.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.102.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.102.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.103.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.103.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.103.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.103.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.104.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.104.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.105.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.105.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.106.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.106.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.107.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.107.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.107.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.107.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.108.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.108.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.109.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.109.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.110.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.110.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.110.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.110.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.111.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.111.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.112.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.112.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.113.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.113.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.114.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.114.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.114.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.114.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.115.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.115.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.116.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.116.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.117.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.117.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.117.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.117.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.118.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.118.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.119.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.119.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.120.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.120.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.121.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.121.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.121.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.121.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.122.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.122.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.123.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.123.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.124.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.124.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.124.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.124.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.125.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.125.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.126.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.126.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.127.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.127.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.128.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.128.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.128.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.128.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.129.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.129.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.130.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.130.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.131.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.131.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.131.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.131.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.132.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.132.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.133.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.133.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.134.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.134.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.135.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.135.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.135.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.135.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.136.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.136.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.137.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.137.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.138.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.138.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.138.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.138.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.139.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.139.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.140.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.140.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.141.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.141.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.142.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.142.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.142.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.142.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.143.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.143.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.144.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.144.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.145.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.145.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.145.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.145.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.146.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.146.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.147.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.147.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.148.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.148.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.149.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", 
"model.layers.52.mlp.experts.149.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.149.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.149.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.150.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.150.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.151.down_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.151.down_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.gate_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.152.gate_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.up_proj.weight": "model-00137-of-000163.safetensors", - "model.layers.52.mlp.experts.152.up_proj.weight_scale_inv": "model-00137-of-000163.safetensors", "model.layers.52.mlp.experts.152.down_proj.weight": "model-00137-of-000163.safetensors", - 
"model.layers.52.mlp.experts.152.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.153.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.153.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.154.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.154.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.155.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.155.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.156.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.156.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.156.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.156.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.157.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.157.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.158.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.158.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.159.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.159.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.159.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.159.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.160.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.160.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.161.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.161.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.162.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.162.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.163.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.163.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.163.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.163.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.164.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.164.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.165.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.165.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.166.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.166.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.166.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.166.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.167.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.167.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.168.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.168.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.169.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.169.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.170.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.170.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.170.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.170.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.171.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.171.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.172.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.172.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.173.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.173.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.173.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.173.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.174.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.174.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.175.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.175.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.176.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.176.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.177.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.177.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.177.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.177.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.178.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.178.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.179.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.179.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.180.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.180.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.180.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.180.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.181.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.181.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.182.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.182.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.183.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.183.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.184.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.184.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.184.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.184.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.185.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.185.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.186.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.186.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.187.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.187.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.187.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.187.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.188.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.188.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.189.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.189.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.190.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.190.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.191.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.191.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.191.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.191.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.192.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.192.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.193.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.193.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.194.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.194.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.194.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.194.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.195.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.195.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.196.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.196.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.197.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.197.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.198.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.198.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.198.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.198.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.199.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.199.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.200.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.200.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.201.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.201.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.201.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.201.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.202.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.202.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.203.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.203.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.204.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.204.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.205.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.205.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.205.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.205.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.206.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.206.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.207.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.207.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.208.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.208.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.208.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.208.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.209.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.209.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.210.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.210.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.211.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.211.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.212.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.212.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.212.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.212.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.213.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.213.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.214.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.214.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.215.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.215.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.215.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.215.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.216.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.216.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.217.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.217.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.218.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.218.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.219.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.219.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.219.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.219.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.220.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.220.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.221.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.221.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.222.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.222.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.222.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.222.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.223.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.223.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.224.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.224.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.225.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.225.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.226.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.226.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.226.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.226.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.227.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.227.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.228.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.228.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.229.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.229.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.229.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.229.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.230.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.230.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.231.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.231.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.232.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.232.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.233.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.233.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.233.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.233.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.234.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.234.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.235.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.235.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.236.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.236.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.236.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.236.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.237.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.237.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.238.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.238.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.239.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.239.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.240.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.240.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.240.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.240.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.241.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.241.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.242.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.242.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.243.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.243.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.243.down_proj.weight": "model-00138-of-000163.safetensors", - 
"model.layers.52.mlp.experts.243.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.244.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.244.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.245.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.245.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.246.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.246.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.247.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", 
"model.layers.52.mlp.experts.247.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.247.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.247.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.248.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.248.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.up_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.249.down_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.249.down_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.250.gate_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.250.gate_proj.weight_scale_inv": "model-00138-of-000163.safetensors", "model.layers.52.mlp.experts.250.up_proj.weight": "model-00138-of-000163.safetensors", - "model.layers.52.mlp.experts.250.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.250.down_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.52.mlp.experts.250.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.251.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.251.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.252.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.252.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.253.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.253.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.254.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.52.mlp.experts.254.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.254.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.254.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.mlp.experts.255.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.52.mlp.experts.255.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.52.input_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.52.post_attention_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_a_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.q_a_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_a_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.q_b_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.q_b_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_a_proj_with_mqa.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_a_layernorm.weight": "model-00139-of-000163.safetensors", "model.layers.53.self_attn.kv_b_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.kv_b_proj.weight_scale_inv": 
"model-00139-of-000163.safetensors", "model.layers.53.self_attn.o_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.self_attn.o_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.gate.weight": "model-00139-of-000163.safetensors", "model.layers.53.mlp.gate.e_score_correction_bias": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.shared_experts.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.shared_experts.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.0.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.0.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.1.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.1.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.1.down_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.1.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.2.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.2.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.3.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.3.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.4.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.4.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.up_proj.weight": 
"model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.5.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.5.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.6.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.6.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.7.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.7.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.8.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.8.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.9.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.9.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.9.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.9.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.10.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.10.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.11.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.11.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.12.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.12.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.12.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.12.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.13.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.13.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.14.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.14.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.15.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.15.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.16.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.16.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.16.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.16.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.17.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.17.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.18.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.18.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.19.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.19.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.19.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.19.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.20.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.20.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.21.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.21.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.22.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.22.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.23.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.23.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.23.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.23.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.24.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.24.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.25.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.25.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.26.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.26.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.26.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.26.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.27.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.27.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.28.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.28.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.29.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.29.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.30.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.30.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.30.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.30.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.31.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.31.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.32.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.32.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.33.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.33.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.33.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.33.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.34.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.34.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.35.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.35.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.36.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.36.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.37.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.37.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.37.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.37.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.38.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.38.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.39.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.39.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.40.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.40.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.40.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.40.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.41.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.41.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.42.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.42.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.43.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.43.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.44.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.44.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.44.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.44.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.45.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.45.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.46.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.46.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.47.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.47.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.47.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.47.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.48.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.48.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.49.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.49.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.50.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.50.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.51.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.51.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.51.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.51.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.52.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.52.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.53.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.53.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.54.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.54.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.54.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.54.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.55.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.55.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.56.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.56.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.57.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.57.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.58.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.58.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.58.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.58.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.59.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.59.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.60.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.60.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.61.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.61.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.61.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.61.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.62.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.62.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.63.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.63.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.64.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.64.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.65.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.65.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.65.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.65.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.66.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.66.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.67.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.67.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.68.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.68.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.68.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.68.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.69.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.69.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.70.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.70.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.71.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.71.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.72.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.72.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.72.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.72.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.73.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.73.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.74.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.74.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.75.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.75.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.75.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.75.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.76.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.76.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.77.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.77.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.78.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.78.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.79.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.79.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.79.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.79.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.80.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.80.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.81.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.81.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.82.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.up_proj.weight": "model-00139-of-000163.safetensors", - 
"model.layers.53.mlp.experts.82.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.82.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.82.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.83.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.83.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.84.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.84.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.85.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.85.down_proj.weight_scale_inv": "model-00139-of-000163.safetensors", 
"model.layers.53.mlp.experts.86.gate_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.gate_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.86.up_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.up_proj.weight_scale_inv": "model-00139-of-000163.safetensors", "model.layers.53.mlp.experts.86.down_proj.weight": "model-00139-of-000163.safetensors", - "model.layers.53.mlp.experts.86.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.87.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.87.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.88.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.88.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.89.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.89.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.89.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.89.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.90.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.90.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.91.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.91.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.92.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.92.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.93.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.93.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.93.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.93.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.94.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.94.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.95.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.95.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.96.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.96.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.96.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.96.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.97.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.97.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.98.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.98.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.99.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.99.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.100.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.100.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.100.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.100.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.101.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.101.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.102.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.102.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.103.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.103.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.103.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.103.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.104.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.104.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.105.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.105.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.106.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.106.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.107.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.107.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.107.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.107.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.108.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.108.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.109.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.109.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.110.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.110.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.110.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.110.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.111.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.111.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.112.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.112.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.113.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.113.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.114.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.114.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.114.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.114.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.115.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.115.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.116.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.116.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.117.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.117.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.117.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.117.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.118.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.118.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.119.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.119.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.120.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.120.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.121.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.121.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.121.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.121.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.122.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.122.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.123.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.123.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.124.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.124.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.124.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.124.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.125.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.125.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.126.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.126.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.127.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.127.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.128.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.128.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.128.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.128.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.129.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.129.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.130.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.130.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.131.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.131.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.131.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.131.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.132.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.132.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.133.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.133.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.134.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.134.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.135.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.135.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.135.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.135.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.136.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.136.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.137.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.137.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.138.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.138.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.138.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.138.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.139.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.139.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.140.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.140.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.141.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.141.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.142.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.142.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.142.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.142.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.143.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.143.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.144.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.144.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.145.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.145.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.145.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.145.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.146.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.146.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.147.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.147.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.148.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.148.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.149.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.149.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.149.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.149.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.150.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.150.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.151.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.151.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.152.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.152.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.152.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.152.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.153.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.153.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.154.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.154.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.155.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.155.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.156.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.156.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.156.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.156.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.157.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.157.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.158.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.158.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.159.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.159.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.159.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.159.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.160.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.160.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.161.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.161.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.162.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.162.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.163.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.163.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.163.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.163.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.164.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.164.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.165.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.165.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.166.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.166.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.166.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.166.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.167.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.167.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.168.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.168.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.169.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.169.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.170.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.170.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.170.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.170.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.171.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.171.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.172.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.172.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.173.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.173.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.173.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.173.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.174.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.174.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.175.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.175.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.176.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.176.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.177.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.177.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.177.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.177.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.178.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.178.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.179.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.179.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.180.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.up_proj.weight": "model-00140-of-000163.safetensors", - 
"model.layers.53.mlp.experts.180.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.180.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.180.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.181.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.181.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.182.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.182.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.up_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.183.down_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.183.down_proj.weight_scale_inv": "model-00140-of-000163.safetensors", 
"model.layers.53.mlp.experts.184.gate_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.184.gate_proj.weight_scale_inv": "model-00140-of-000163.safetensors", "model.layers.53.mlp.experts.184.up_proj.weight": "model-00140-of-000163.safetensors", - "model.layers.53.mlp.experts.184.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.184.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.184.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.185.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.185.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.186.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.186.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.187.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.187.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.187.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.187.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.188.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.188.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.189.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.189.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.190.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.190.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.191.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.191.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.191.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.191.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.192.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.192.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.193.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.193.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.194.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.194.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.194.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.194.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.195.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.195.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.196.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.196.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.197.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.197.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.198.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.198.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.198.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.198.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.199.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.199.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.200.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.200.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.201.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.201.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.201.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.201.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.202.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.202.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.203.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.203.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.204.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.204.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.205.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.205.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.205.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.205.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.206.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.206.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.207.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.207.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.208.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.208.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.208.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.208.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.209.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.209.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.210.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.210.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.211.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.211.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.212.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.212.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.212.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.212.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.213.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.213.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.214.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.214.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.215.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.215.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.215.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.215.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.216.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.216.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.217.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.217.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.218.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.218.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.219.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.219.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.219.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.219.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.220.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.220.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.221.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.221.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.222.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.222.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.222.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.222.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.223.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.223.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.224.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.224.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.225.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.225.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.226.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.226.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.226.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.226.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.227.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.227.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.228.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.228.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.229.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.229.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.229.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.229.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.230.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.230.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.231.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.231.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.232.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.232.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.233.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.233.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.233.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.233.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.234.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.234.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.235.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.235.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.236.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.236.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.236.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.236.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.237.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.237.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.238.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.238.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.239.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.239.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.240.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.240.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.240.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.240.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.241.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.241.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.242.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.242.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.243.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.243.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.243.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.243.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.244.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.244.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.245.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.245.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.246.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.246.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.247.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.247.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.247.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.247.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.248.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.248.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.249.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.249.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.250.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.up_proj.weight": "model-00141-of-000163.safetensors", - 
"model.layers.53.mlp.experts.250.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.250.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.250.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.251.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.251.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.252.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.252.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.253.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.253.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", 
"model.layers.53.mlp.experts.254.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.254.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.254.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.254.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.gate_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.gate_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.up_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.up_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.mlp.experts.255.down_proj.weight": "model-00141-of-000163.safetensors", - "model.layers.53.mlp.experts.255.down_proj.weight_scale_inv": "model-00141-of-000163.safetensors", "model.layers.53.input_layernorm.weight": "model-00141-of-000163.safetensors", "model.layers.53.post_attention_layernorm.weight": "model-00141-of-000163.safetensors", "model.layers.54.self_attn.q_a_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.q_a_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.q_a_layernorm.weight": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.q_b_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.q_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_a_proj_with_mqa.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_a_layernorm.weight": 
"model-00142-of-000163.safetensors", "model.layers.54.self_attn.kv_b_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.kv_b_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.self_attn.o_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.self_attn.o_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.gate.weight": "model-00142-of-000163.safetensors", "model.layers.54.mlp.gate.e_score_correction_bias": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.shared_experts.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.shared_experts.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.0.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.0.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.1.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.up_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.1.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.1.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.1.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.2.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.2.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.3.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.3.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.4.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.4.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.gate_proj.weight": 
"model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.5.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.5.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.6.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.6.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.7.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.7.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.8.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.8.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.8.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.8.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.9.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.9.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.10.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.10.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.11.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.11.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.12.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.12.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.12.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.12.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.13.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.13.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.14.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.14.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.15.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.15.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.15.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.15.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.16.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.16.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.17.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.17.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.18.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.18.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.19.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.19.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.19.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.19.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.20.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.20.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.21.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.21.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.22.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.22.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.22.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.22.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.23.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.23.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.24.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.24.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.25.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.25.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.26.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.26.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.26.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.26.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.27.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.27.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.28.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.28.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.29.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.29.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.29.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.29.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.30.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.30.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.31.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.31.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.32.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.32.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.33.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.33.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.33.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.33.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.34.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.34.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.35.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.35.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.36.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.36.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.36.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.36.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.37.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.37.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.38.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.38.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.39.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.39.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.40.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.40.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.40.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.40.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.41.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.41.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.42.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.42.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.43.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.43.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.43.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.43.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.44.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.44.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.45.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.45.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.46.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.46.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.47.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.47.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.47.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.47.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.48.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.48.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.49.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.49.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.50.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.50.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.50.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.50.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.51.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.51.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.52.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.52.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.53.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.53.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.54.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.54.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.54.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.54.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.55.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.55.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.56.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.56.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.57.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.57.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.57.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.57.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.58.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.58.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.59.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.59.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.60.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.60.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.61.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.61.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.61.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.61.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.62.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.62.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.63.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.63.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.64.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.64.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.64.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.64.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.65.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.65.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.66.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.66.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.67.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.67.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.68.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.68.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.68.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.68.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.69.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.69.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.70.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.70.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.71.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.71.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.71.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.71.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.72.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.72.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.73.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.73.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.74.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.74.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.75.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.75.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.75.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.75.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.76.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.76.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.77.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.77.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.78.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.78.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.78.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.78.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.79.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.79.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.80.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.80.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.81.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.81.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.82.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.82.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.82.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.82.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.83.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.83.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.84.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.84.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.85.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.85.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", 
"model.layers.54.mlp.experts.85.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.85.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.86.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.86.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.87.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.87.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.88.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.88.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.gate_proj.weight": "model-00142-of-000163.safetensors", - 
"model.layers.54.mlp.experts.89.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.89.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.89.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.89.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.90.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.90.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.gate_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.up_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.up_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.91.down_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.91.down_proj.weight_scale_inv": "model-00142-of-000163.safetensors", "model.layers.54.mlp.experts.92.gate_proj.weight": "model-00142-of-000163.safetensors", - "model.layers.54.mlp.experts.92.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.92.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.92.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.92.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.92.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.93.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.93.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.94.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.94.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.95.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.95.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.96.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.96.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.96.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.96.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.97.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.97.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.98.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.98.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.99.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.99.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.99.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.99.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.100.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.100.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.101.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.101.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.102.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.102.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.103.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.103.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.103.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.103.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.104.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.104.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.105.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.105.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.106.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.106.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.106.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.106.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.107.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.107.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.108.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.108.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.109.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.109.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.110.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.110.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.110.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.110.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.111.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.111.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.112.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.112.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.113.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.113.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.113.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.113.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.114.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.114.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.115.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.115.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.116.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.116.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.117.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.117.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.117.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.117.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.118.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.118.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.119.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.119.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.120.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.120.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.120.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.120.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.121.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.121.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.122.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.122.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.123.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.123.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.124.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.124.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.124.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.124.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.125.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.125.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.126.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.126.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.127.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.127.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.127.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.127.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.128.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.128.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.129.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.129.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.130.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.130.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.131.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.131.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.131.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.131.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.132.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.132.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.133.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.133.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.134.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.134.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.134.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.134.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.135.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.135.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.136.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.136.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.137.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.137.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.138.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.138.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.138.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.138.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.139.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.139.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.140.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.140.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.141.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.141.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.141.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.141.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.142.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.142.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.143.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.143.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.144.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.144.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.145.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.145.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.145.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.145.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.146.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.146.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.147.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.147.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.148.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.148.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.148.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.148.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.149.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.149.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.150.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.150.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.151.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.151.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.152.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.152.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.152.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.152.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.153.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.153.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.154.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.154.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.155.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.155.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.155.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.155.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.156.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.156.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.157.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.157.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.158.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.158.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.159.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.159.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.159.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.159.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.160.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.160.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.161.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.161.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.162.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.162.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.162.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.162.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.163.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.163.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.164.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.164.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.165.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.165.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.166.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.166.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.166.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.166.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.167.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.167.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.168.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.168.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.169.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.169.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.169.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.169.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.170.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.170.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.171.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.171.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.172.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.172.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.173.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.173.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.173.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.173.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.174.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.174.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.175.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.175.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.176.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.176.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.176.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.176.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.177.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.177.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.178.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.178.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.179.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.179.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.180.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.180.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.180.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.180.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.181.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.181.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.182.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.182.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.183.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.183.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", 
"model.layers.54.mlp.experts.183.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.183.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.184.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.184.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.185.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.185.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.186.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.186.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.gate_proj.weight": "model-00143-of-000163.safetensors", - 
"model.layers.54.mlp.experts.187.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.187.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.187.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.187.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.188.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.188.down_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.gate_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.gate_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.up_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.up_proj.weight_scale_inv": "model-00143-of-000163.safetensors", "model.layers.54.mlp.experts.189.down_proj.weight": "model-00143-of-000163.safetensors", - "model.layers.54.mlp.experts.189.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.190.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.190.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.190.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.190.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.191.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.191.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.192.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.192.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.193.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.193.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.194.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.194.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.194.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.194.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.195.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.195.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.196.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.196.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.197.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.197.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.197.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.197.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.198.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.198.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.199.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.199.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.200.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.200.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.201.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.201.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.201.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.201.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.202.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.202.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.203.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.203.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.204.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.204.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.204.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.204.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.205.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.205.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.206.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.206.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.207.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.207.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.208.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.208.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.208.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.208.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.209.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.209.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.210.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.210.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.211.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.211.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.211.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.211.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.212.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.212.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.213.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.213.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.214.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.214.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.215.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.215.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.215.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.215.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.216.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.216.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.217.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.217.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.218.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.218.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.218.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.218.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.219.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.219.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.220.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.220.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.221.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.221.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.222.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.222.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.222.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.222.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.223.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.223.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.224.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.224.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.225.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.225.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.225.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.225.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.226.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.226.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.227.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.227.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.228.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.228.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.229.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.229.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.229.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.229.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.230.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.230.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.231.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.231.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.232.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.232.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.232.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.232.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.233.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.233.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.234.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.234.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.235.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.235.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.236.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.236.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.236.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.236.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.237.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.237.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.238.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.238.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.239.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.239.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.239.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.239.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.240.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.240.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.241.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.241.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.242.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.242.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.243.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.243.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.243.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.243.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.244.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.244.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.245.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.245.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.246.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.246.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.246.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.246.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.247.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.247.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.248.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.248.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.249.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.249.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.54.mlp.experts.250.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.250.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.250.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.250.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.251.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.251.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.252.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.252.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.253.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.253.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.54.mlp.experts.253.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.253.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.254.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.254.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.mlp.experts.255.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.54.mlp.experts.255.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.54.input_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.54.post_attention_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_a_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.q_a_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_a_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.q_b_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.q_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_a_proj_with_mqa.weight": 
"model-00144-of-000163.safetensors", - "model.layers.55.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_a_layernorm.weight": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.kv_b_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.kv_b_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.self_attn.o_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.self_attn.o_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.gate.weight": "model-00144-of-000163.safetensors", "model.layers.55.mlp.gate.e_score_correction_bias": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.shared_experts.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.shared_experts.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.0.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.0.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.gate_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.55.mlp.experts.1.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.1.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.1.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.1.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.2.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.2.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.3.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.3.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.4.down_proj.weight": 
"model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.4.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.5.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.5.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.6.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.6.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.7.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.7.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.8.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.55.mlp.experts.8.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.8.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.8.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.9.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.9.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.10.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.10.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.11.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.11.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.11.down_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.55.mlp.experts.11.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.12.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.12.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.13.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.13.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.14.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.14.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.15.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.55.mlp.experts.15.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.15.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.15.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.16.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.16.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.17.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.17.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.18.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.18.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.18.down_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.55.mlp.experts.18.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.19.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.19.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.20.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.20.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.21.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.21.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.22.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", 
"model.layers.55.mlp.experts.22.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.22.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.22.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.23.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.23.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.24.down_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.24.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.25.gate_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.up_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.25.up_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.25.down_proj.weight": "model-00144-of-000163.safetensors", - 
"model.layers.55.mlp.experts.25.down_proj.weight_scale_inv": "model-00144-of-000163.safetensors", "model.layers.55.mlp.experts.26.gate_proj.weight": "model-00144-of-000163.safetensors", - "model.layers.55.mlp.experts.26.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.26.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.26.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.26.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.26.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.27.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.27.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.28.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.28.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.29.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.29.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.29.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.29.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.30.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.30.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.31.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.31.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.32.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.32.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.32.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.32.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.33.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.33.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.34.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.34.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.35.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.35.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.36.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.36.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.36.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.36.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.37.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.37.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.38.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.38.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.39.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.39.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.39.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.39.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.40.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.40.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.41.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.41.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.42.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.42.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.43.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.43.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.43.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.43.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.44.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.44.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.45.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.45.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.46.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.46.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.46.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.46.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.47.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.47.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.48.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.48.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.49.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.49.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.50.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.50.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.50.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.50.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.51.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.51.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.52.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.52.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.53.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.53.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.53.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.53.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.54.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.54.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.55.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.55.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.56.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.56.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.57.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.57.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.57.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.57.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.58.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.58.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.59.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.59.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.60.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.60.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.60.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.60.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.61.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.61.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.62.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.62.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.63.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.63.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.64.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.64.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.64.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.64.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.65.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.65.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.66.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.66.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.67.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.67.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.67.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.67.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.68.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.68.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.69.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.69.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.70.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.70.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.71.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.71.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.71.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.71.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.72.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.72.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.73.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.73.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.74.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.74.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.74.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.74.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.75.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.75.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.76.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.76.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.77.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.77.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.78.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.78.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.78.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.78.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.79.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.79.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.80.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.80.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.81.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.81.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.81.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.81.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.82.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.82.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.83.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.83.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.84.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.84.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.85.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.85.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.85.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.85.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.86.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.86.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.87.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.87.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.88.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.88.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.88.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.88.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.89.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.89.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.90.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.90.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.91.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.91.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.92.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.92.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.92.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.92.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.93.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.93.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.94.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.94.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.95.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.95.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.95.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.95.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.96.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.96.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.97.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.97.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.98.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.98.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.99.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.99.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.99.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.99.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.100.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.100.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.101.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.101.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.102.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.102.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.102.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.102.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.103.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.103.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.104.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.104.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.105.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.105.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.106.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.106.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.106.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.106.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.107.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.107.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.108.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.108.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.109.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.109.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.109.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.109.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.110.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.110.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.111.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.111.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.112.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.112.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.113.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.113.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.113.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.113.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.114.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.114.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.115.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.115.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.116.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.116.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.116.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.116.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.117.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.117.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.118.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.118.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.119.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.119.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.120.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", 
"model.layers.55.mlp.experts.120.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.120.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.120.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.121.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.121.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.122.down_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.122.down_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.gate_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.123.gate_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.up_proj.weight": "model-00145-of-000163.safetensors", - "model.layers.55.mlp.experts.123.up_proj.weight_scale_inv": "model-00145-of-000163.safetensors", "model.layers.55.mlp.experts.123.down_proj.weight": "model-00145-of-000163.safetensors", - 
"model.layers.55.mlp.experts.123.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.124.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.124.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.125.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.125.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.126.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.126.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.127.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.127.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.127.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.127.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.128.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.128.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.129.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.129.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.130.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.130.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.130.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.130.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.131.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.131.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.132.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.132.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.133.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.133.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.134.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.134.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.134.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.134.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.135.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.135.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.136.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.136.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.137.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.137.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.137.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.137.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.138.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.138.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.139.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.139.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.140.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.140.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.141.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.141.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.141.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.141.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.142.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.142.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.143.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.143.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.144.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.144.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.144.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.144.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.145.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.145.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.146.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.146.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.147.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.147.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.148.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.148.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.148.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.148.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.149.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.149.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.150.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.150.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.151.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.151.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.151.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.151.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.152.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.152.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.153.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.153.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.154.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.154.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.155.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.155.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.155.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.155.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.156.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.156.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.157.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.157.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.158.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.158.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.158.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.158.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.159.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.159.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.160.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.160.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.161.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.161.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.162.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.162.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.162.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.162.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.163.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.163.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.164.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.164.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.165.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.165.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.165.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.165.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.166.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.166.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.167.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.167.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.168.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.168.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.169.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.169.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.169.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.169.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.170.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.170.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.171.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.171.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.172.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.172.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.172.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.172.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.173.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.173.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.174.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.174.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.175.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.175.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.176.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.176.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.176.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.176.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.177.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.177.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.178.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.178.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.179.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.179.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.179.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.179.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.180.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.180.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.181.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.181.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.182.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.182.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.183.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.183.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.183.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.183.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.184.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.184.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.185.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.185.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.186.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.186.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.186.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.186.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.187.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.187.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.188.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.188.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.189.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.189.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.190.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.190.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.190.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.190.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.191.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.191.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.192.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.192.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.193.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.193.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.193.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.193.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.194.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.194.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.195.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.195.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.196.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.196.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.197.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.197.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.197.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.197.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.198.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.198.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.199.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.199.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.200.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.200.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.200.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.200.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.201.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.201.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.202.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.202.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.203.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.203.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.204.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.204.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.204.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.204.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.205.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.205.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.206.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.206.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.207.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.207.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.207.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.207.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.208.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.208.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.209.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.209.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.210.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.210.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.211.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.211.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.211.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.211.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.212.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.212.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.213.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.213.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.214.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.214.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.214.down_proj.weight": "model-00146-of-000163.safetensors", - 
"model.layers.55.mlp.experts.214.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.215.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.215.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.216.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.216.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.217.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.217.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.218.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", 
"model.layers.55.mlp.experts.218.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.218.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.218.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.219.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.219.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.up_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.220.down_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.220.down_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.221.gate_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.221.gate_proj.weight_scale_inv": "model-00146-of-000163.safetensors", "model.layers.55.mlp.experts.221.up_proj.weight": "model-00146-of-000163.safetensors", - "model.layers.55.mlp.experts.221.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.221.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.55.mlp.experts.221.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.222.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.222.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.223.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.223.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.224.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.224.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.225.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.55.mlp.experts.225.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.225.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.225.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.226.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.226.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.227.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.227.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.228.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.228.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.228.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.55.mlp.experts.228.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.229.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.229.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.230.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.230.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.231.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.231.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.232.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.55.mlp.experts.232.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.232.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.232.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.233.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.233.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.234.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.234.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.235.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.235.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.235.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.55.mlp.experts.235.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.236.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.236.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.237.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.237.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.238.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.238.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.239.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.55.mlp.experts.239.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.239.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.239.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.240.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.240.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.241.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.241.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.242.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.242.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.242.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.55.mlp.experts.242.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.243.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.243.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.244.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.244.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.245.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.245.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.246.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.55.mlp.experts.246.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.246.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.246.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.247.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.247.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.248.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.248.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.249.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.249.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.249.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.55.mlp.experts.249.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.250.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.250.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.251.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.251.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.252.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.252.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.253.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.55.mlp.experts.253.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.253.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.253.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.254.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.254.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.mlp.experts.255.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.55.mlp.experts.255.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.55.input_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.55.post_attention_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_a_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.q_a_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_a_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.q_b_proj.weight": 
"model-00147-of-000163.safetensors", - "model.layers.56.self_attn.q_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_a_proj_with_mqa.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_a_layernorm.weight": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.kv_b_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.kv_b_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.self_attn.o_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.self_attn.o_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.gate.weight": "model-00147-of-000163.safetensors", "model.layers.56.mlp.gate.e_score_correction_bias": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.shared_experts.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.shared_experts.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.0.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.0.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.0.down_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.0.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.1.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.1.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.2.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.2.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.3.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.3.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.up_proj.weight": 
"model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.4.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.4.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.5.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.5.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.6.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.6.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.7.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.7.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.8.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.8.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.8.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.8.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.9.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.9.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.10.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.10.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.11.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.11.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.11.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.11.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.12.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.12.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.13.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.13.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.14.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.14.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.15.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.15.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.15.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.15.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.16.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.16.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.17.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.17.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.18.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.18.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.18.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.18.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.19.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.19.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.20.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.20.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.21.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.21.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.22.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.22.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.22.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.22.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.23.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.23.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.24.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.24.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.25.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.25.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.25.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.25.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.26.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.26.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.27.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.27.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.28.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.28.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.29.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.29.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.29.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.29.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.30.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.30.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.31.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.31.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.32.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.32.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.32.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.32.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.33.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.33.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.34.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.34.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.35.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.35.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.36.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.36.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.36.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.36.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.37.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.37.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.38.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.38.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.39.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.39.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.39.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.39.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.40.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.40.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.41.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.41.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.42.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.42.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.43.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.43.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.43.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.43.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.44.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.44.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.45.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.45.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.46.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.46.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.46.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.46.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.47.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.47.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.48.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.48.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.49.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.49.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.50.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.50.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.50.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.50.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.51.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.51.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.52.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.52.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.53.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.up_proj.weight": "model-00147-of-000163.safetensors", - 
"model.layers.56.mlp.experts.53.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.53.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.53.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.54.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.54.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.55.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.55.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.56.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.56.down_proj.weight_scale_inv": "model-00147-of-000163.safetensors", 
"model.layers.56.mlp.experts.57.gate_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.gate_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.57.up_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.up_proj.weight_scale_inv": "model-00147-of-000163.safetensors", "model.layers.56.mlp.experts.57.down_proj.weight": "model-00147-of-000163.safetensors", - "model.layers.56.mlp.experts.57.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.58.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.58.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.59.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.59.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.60.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.60.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.60.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.60.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.61.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.61.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.62.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.62.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.63.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.63.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.64.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.64.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.64.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.64.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.65.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.65.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.66.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.66.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.67.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.67.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.67.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.67.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.68.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.68.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.69.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.69.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.70.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.70.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.71.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.71.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.71.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.71.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.72.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.72.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.73.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.73.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.74.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.74.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.74.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.74.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.75.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.75.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.76.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.76.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.77.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.77.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.78.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.78.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.78.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.78.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.79.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.79.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.80.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.80.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.81.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.81.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.81.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.81.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.82.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.82.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.83.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.83.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.84.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.84.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.85.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.85.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.85.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.85.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.86.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.86.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.87.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.87.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.88.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.88.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.88.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.88.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.89.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.89.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.90.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.90.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.91.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.91.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.92.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.92.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.92.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.92.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.93.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.93.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.94.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.94.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.95.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.95.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.95.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.95.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.96.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.96.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.97.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.97.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.98.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.98.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.99.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.99.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.99.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.99.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.100.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.100.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.101.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.101.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.102.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.102.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.102.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.102.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.103.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.103.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.104.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.104.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.105.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.105.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.106.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.106.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.106.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.106.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.107.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.107.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.108.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.108.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.109.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.109.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.109.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.109.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.110.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.110.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.111.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.111.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.112.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.112.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.113.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.113.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.113.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.113.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.114.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.114.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.115.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.115.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.116.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.116.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.116.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.116.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.117.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.117.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.118.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.118.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.119.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.119.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.120.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.120.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.120.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.120.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.121.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.121.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.122.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.122.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.123.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.123.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.123.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.123.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.124.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.124.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.125.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.125.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.126.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.126.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.127.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.127.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.127.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.127.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.128.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.128.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.129.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.129.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.130.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.130.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.130.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.130.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.131.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.131.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.132.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.132.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.133.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.133.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.134.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.134.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.134.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.134.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.135.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.135.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.136.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.136.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.137.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.137.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.137.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.137.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.138.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.138.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.139.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.139.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.140.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.140.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.141.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.141.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.141.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.141.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.142.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.142.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.143.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.143.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.144.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.144.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.144.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.144.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.145.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.145.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.146.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.146.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.147.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.147.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.148.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.148.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.148.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.148.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.149.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.149.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.150.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.150.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.151.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.up_proj.weight": "model-00148-of-000163.safetensors", - 
"model.layers.56.mlp.experts.151.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.151.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.151.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.152.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.152.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.153.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.153.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.up_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.154.down_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.154.down_proj.weight_scale_inv": "model-00148-of-000163.safetensors", 
"model.layers.56.mlp.experts.155.gate_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.155.gate_proj.weight_scale_inv": "model-00148-of-000163.safetensors", "model.layers.56.mlp.experts.155.up_proj.weight": "model-00148-of-000163.safetensors", - "model.layers.56.mlp.experts.155.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.155.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.155.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.156.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.156.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.157.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.157.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.158.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.158.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.158.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.158.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.159.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.159.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.160.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.160.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.161.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.161.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.162.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.162.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.162.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.162.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.163.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.163.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.164.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.164.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.165.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.165.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.165.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.165.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.166.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.166.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.167.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.167.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.168.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.168.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.169.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.169.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.169.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.169.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.170.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.170.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.171.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.171.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.172.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.172.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.172.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.172.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.173.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.173.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.174.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.174.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.175.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.175.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.176.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.176.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.176.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.176.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.177.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.177.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.178.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.178.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.179.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.179.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.179.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.179.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.180.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.180.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.181.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.181.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.182.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.182.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.183.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.183.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.183.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.183.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.184.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.184.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.185.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.185.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.186.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.186.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.186.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.186.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.187.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.187.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.188.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.188.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.189.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.189.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.190.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.190.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.190.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.190.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.191.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.191.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.192.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.192.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.193.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.193.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.193.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.193.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.194.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.194.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.195.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.195.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.196.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.196.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.197.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.197.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.197.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.197.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.198.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.198.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.199.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.199.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.200.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.200.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.200.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.200.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.201.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.201.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.202.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.202.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.203.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.203.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.204.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.204.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.204.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.204.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.205.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.205.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.206.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.206.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.207.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.207.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.207.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.207.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.208.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.208.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.209.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.209.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.210.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.210.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.211.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.211.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.211.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.211.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.212.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.212.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.213.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.213.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.214.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.214.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.214.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.214.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.215.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.215.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.216.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.216.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.217.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.217.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.218.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.218.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.218.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.218.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.219.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.219.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.220.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.220.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.221.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.221.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.221.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.221.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.222.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.222.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.223.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.223.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.224.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.224.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.225.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.225.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.225.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.225.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.226.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.226.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.227.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.227.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.228.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.228.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.228.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.228.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.229.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.229.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.230.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.230.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.231.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.231.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.232.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.232.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.232.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.232.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.233.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.233.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.234.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.234.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.235.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.235.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.235.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.235.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.236.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.236.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.237.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.237.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.238.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.238.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.239.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.239.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.239.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.239.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.240.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.240.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.241.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.241.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.242.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.242.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.242.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.242.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.243.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.243.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.244.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.244.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.245.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.245.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.246.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.246.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.246.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.246.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.247.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.247.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.248.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.248.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.249.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.up_proj.weight": "model-00149-of-000163.safetensors", - 
"model.layers.56.mlp.experts.249.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.249.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.249.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.250.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.250.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.251.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.251.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.gate_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.up_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.up_proj.weight_scale_inv": "model-00149-of-000163.safetensors", "model.layers.56.mlp.experts.252.down_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.252.down_proj.weight_scale_inv": "model-00149-of-000163.safetensors", 
"model.layers.56.mlp.experts.253.gate_proj.weight": "model-00149-of-000163.safetensors", - "model.layers.56.mlp.experts.253.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.253.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.253.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.253.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.253.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.254.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.254.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.mlp.experts.255.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.56.mlp.experts.255.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.56.input_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.56.post_attention_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_a_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.self_attn.q_a_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_a_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.q_b_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.q_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_a_proj_with_mqa.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_a_layernorm.weight": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.kv_b_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.kv_b_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.self_attn.o_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.self_attn.o_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.gate.weight": "model-00150-of-000163.safetensors", "model.layers.57.mlp.gate.e_score_correction_bias": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.shared_experts.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.shared_experts.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.up_proj.weight": 
"model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.0.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.0.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.1.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.1.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.2.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.2.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.3.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.3.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.4.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.4.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.4.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.4.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.5.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.5.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.6.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.6.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.up_proj.weight_scale_inv": 
"model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.7.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.7.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.8.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.8.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.9.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.9.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.10.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.10.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.11.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.11.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.11.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.11.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.12.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.12.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.13.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.13.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.14.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.14.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.14.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.14.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.15.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.15.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.16.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.16.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.17.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.17.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.18.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.18.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.18.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.18.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.19.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.19.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.20.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.20.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.21.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.21.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.21.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.21.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.22.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.22.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.23.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.23.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.24.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.24.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.25.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.25.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.25.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.25.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.26.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.26.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.27.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.27.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.28.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.28.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.28.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.28.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.29.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.29.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.30.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.30.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.31.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.31.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.32.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.32.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.32.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.32.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.33.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.33.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.34.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.34.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.35.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.35.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.35.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.35.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.36.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.36.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.37.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.37.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.38.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.38.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.39.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.39.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.39.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.39.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.40.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.40.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.41.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.41.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.42.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.42.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.42.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.42.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.43.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.43.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.44.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.44.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.45.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.45.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.46.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.46.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.46.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.46.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.47.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.47.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.48.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.48.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.49.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.49.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.49.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.49.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.50.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.50.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.51.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.51.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.52.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.52.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.53.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.53.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.53.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.53.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.54.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.54.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.55.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.55.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.56.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.56.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.56.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.56.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.57.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.57.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.58.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.58.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.59.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.59.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.60.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.60.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.60.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.60.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.61.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.61.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.62.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.62.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.63.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.63.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.63.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.63.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.64.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.64.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.65.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.65.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.66.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.66.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.67.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.67.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.67.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.67.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.68.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.68.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.69.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.69.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.70.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.70.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.70.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.70.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.71.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.71.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.72.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.72.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.73.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.73.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.74.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.74.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.74.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.74.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.75.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.75.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.76.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.76.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.77.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.77.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.77.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.77.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.78.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.78.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.79.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.79.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.80.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.80.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.81.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.81.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.81.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.81.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.82.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.82.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.83.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.83.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.84.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.84.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", 
"model.layers.57.mlp.experts.84.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.84.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.85.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.85.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.86.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.86.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.87.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.87.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.gate_proj.weight": "model-00150-of-000163.safetensors", - 
"model.layers.57.mlp.experts.88.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.88.up_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.88.down_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.88.down_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.89.gate_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.89.gate_proj.weight_scale_inv": "model-00150-of-000163.safetensors", "model.layers.57.mlp.experts.89.up_proj.weight": "model-00150-of-000163.safetensors", - "model.layers.57.mlp.experts.89.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.89.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.89.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.90.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.90.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.91.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.91.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.91.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.91.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.92.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.92.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.93.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.93.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.94.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.94.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.95.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.95.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.95.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.95.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.96.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.96.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.97.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.97.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.98.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.98.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.98.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.98.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.99.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.99.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.100.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.100.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.101.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.101.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.102.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.102.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.102.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.102.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.103.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.103.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.104.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.104.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.105.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.105.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.105.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.105.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.106.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.106.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.107.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.107.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.108.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.108.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.109.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.109.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.109.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.109.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.110.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.110.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.111.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.111.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.112.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.112.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.112.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.112.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.113.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.113.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.114.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.114.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.115.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.115.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.116.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.116.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.116.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.116.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.117.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.117.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.118.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.118.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.119.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.119.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.119.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.119.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.120.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.120.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.121.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.121.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.122.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.122.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.123.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.123.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.123.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.123.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.124.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.124.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.125.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.125.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.126.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.126.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.126.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.126.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.127.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.127.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.128.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.128.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.129.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.129.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.130.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.130.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.130.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.130.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.131.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.131.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.132.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.132.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.133.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.133.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.133.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.133.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.134.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.134.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.135.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.135.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.136.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.136.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.137.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.137.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.137.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.137.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.138.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.138.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.139.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.139.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.140.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.140.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.140.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.140.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.141.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.141.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.142.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.142.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.143.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.143.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.144.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.144.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.144.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.144.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.145.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.145.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.146.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.146.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.147.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.147.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.147.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.147.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.148.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.148.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.149.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.149.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.150.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.150.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.151.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.151.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.151.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.151.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.152.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.152.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.153.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.153.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.154.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.154.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.154.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.154.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.155.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.155.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.156.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.156.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.157.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.157.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.158.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.158.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.158.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.158.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.159.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.159.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.160.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.160.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.161.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.161.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.161.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.161.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.162.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.162.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.163.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.163.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.164.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.164.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.165.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.165.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.165.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.165.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.166.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.166.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.167.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.167.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.168.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.168.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.168.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.168.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.169.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.169.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.170.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.170.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.171.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.171.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.172.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.172.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.172.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.172.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.173.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.173.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.174.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.174.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.175.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.175.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.175.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.175.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.176.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.176.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.177.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.177.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.178.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.178.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.179.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.179.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.179.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.179.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.180.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.180.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.181.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.181.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.182.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.182.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", 
"model.layers.57.mlp.experts.182.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.182.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.183.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.183.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.184.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.184.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.185.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.185.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.gate_proj.weight": "model-00151-of-000163.safetensors", - 
"model.layers.57.mlp.experts.186.gate_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.up_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.186.up_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.186.down_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.186.down_proj.weight_scale_inv": "model-00151-of-000163.safetensors", "model.layers.57.mlp.experts.187.gate_proj.weight": "model-00151-of-000163.safetensors", - "model.layers.57.mlp.experts.187.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.187.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.187.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.187.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.187.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.188.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.188.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.189.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.189.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.189.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.189.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.190.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.190.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.191.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.191.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.192.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.192.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.193.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.193.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.193.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.193.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.194.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.194.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.195.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.195.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.196.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.196.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.196.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.196.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.197.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.197.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.198.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.198.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.199.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.199.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.200.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.200.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.200.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.200.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.201.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.201.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.202.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.202.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.203.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.203.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.203.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.203.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.204.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.204.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.205.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.205.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.206.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.206.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.207.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.207.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.207.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.207.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.208.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.208.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.209.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.209.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.210.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.210.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.210.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.210.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.211.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.211.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.212.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.212.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.213.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.213.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.214.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.214.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.214.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.214.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.215.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.215.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.216.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.216.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.217.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.217.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.217.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.217.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.218.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.218.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.219.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.219.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.220.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.220.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.221.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.221.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.221.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.221.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.222.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.222.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.223.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.223.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.224.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.224.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.224.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.224.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.225.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.225.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.226.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.226.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.227.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.227.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.228.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.228.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.228.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.228.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.229.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.229.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.230.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.230.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.231.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.231.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.231.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.231.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.232.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.232.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.233.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.233.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.234.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.234.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.235.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.235.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.235.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.235.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.236.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.236.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.237.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.237.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.238.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.238.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.238.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.238.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.239.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.239.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.240.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.240.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.241.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.241.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.242.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.242.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.242.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.242.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.243.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.243.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.244.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.244.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.245.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.245.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.245.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.245.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.246.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.246.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.247.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.247.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.248.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.248.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.57.mlp.experts.249.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.249.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.249.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.249.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.250.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.250.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.251.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.251.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.252.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.252.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.57.mlp.experts.252.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.252.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.253.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.253.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.254.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.254.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.mlp.experts.255.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.57.mlp.experts.255.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.57.input_layernorm.weight": "model-00152-of-000163.safetensors", 
"model.layers.57.post_attention_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_a_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.q_a_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_a_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.q_b_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.q_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_a_proj_with_mqa.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_a_layernorm.weight": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.kv_b_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.kv_b_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.self_attn.o_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.self_attn.o_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.gate.weight": "model-00152-of-000163.safetensors", "model.layers.58.mlp.gate.e_score_correction_bias": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.shared_experts.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.shared_experts.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.gate_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.58.mlp.experts.0.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.0.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.0.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.0.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.1.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.1.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.2.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.2.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.3.down_proj.weight": 
"model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.3.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.4.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.4.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.5.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.5.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.6.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.6.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.7.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.58.mlp.experts.7.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.7.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.7.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.8.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.8.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.9.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.9.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.10.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.10.down_proj.weight_scale_inv": 
"model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.11.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.11.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.12.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.12.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.13.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.13.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.14.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.up_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.58.mlp.experts.14.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.14.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.14.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.15.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.15.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.16.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.16.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.17.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.17.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", 
"model.layers.58.mlp.experts.18.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.18.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.18.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.18.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.19.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.19.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.20.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.20.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.21.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.up_proj.weight": "model-00152-of-000163.safetensors", - 
"model.layers.58.mlp.experts.21.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.21.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.21.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.up_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.22.down_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.22.down_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.23.gate_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.23.gate_proj.weight_scale_inv": "model-00152-of-000163.safetensors", "model.layers.58.mlp.experts.23.up_proj.weight": "model-00152-of-000163.safetensors", - "model.layers.58.mlp.experts.23.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.23.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.23.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.24.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.24.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.25.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.25.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.25.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.25.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.26.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.26.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.27.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.27.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.28.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.28.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.28.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.28.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.29.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.29.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.30.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.30.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.31.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.31.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.32.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.32.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.32.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.32.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.33.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.33.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.34.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.34.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.35.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.35.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.35.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.35.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.36.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.36.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.37.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.37.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.38.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.38.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.39.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.39.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.39.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.39.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.40.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.40.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.41.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.41.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.42.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.42.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.42.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.42.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.43.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.43.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.44.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.44.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.45.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.45.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.46.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.46.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.46.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.46.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.47.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.47.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.48.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.48.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.49.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.49.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.49.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.49.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.50.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.50.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.51.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.51.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.52.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.52.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.53.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.53.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.53.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.53.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.54.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.54.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.55.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.55.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.56.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.56.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.56.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.56.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.57.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.57.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.58.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.58.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.59.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.59.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.60.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.60.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.60.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.60.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.61.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.61.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.62.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.62.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.63.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.63.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.63.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.63.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.64.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.64.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.65.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.65.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.66.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.66.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.67.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.67.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.67.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.67.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.68.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.68.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.69.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.69.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.70.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.70.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.70.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.70.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.71.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.71.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.72.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.72.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.73.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.73.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.74.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.74.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.74.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.74.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.75.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.75.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.76.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.76.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.77.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.77.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.77.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.77.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.78.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.78.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.79.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.79.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.80.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.80.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.81.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.81.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.81.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.81.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.82.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.82.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.83.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.83.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.84.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.84.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.84.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.84.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.85.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.85.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.86.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.86.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.87.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.87.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.88.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.88.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.88.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.88.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.89.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.89.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.90.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.90.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.91.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.91.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.91.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.91.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.92.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.92.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.93.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.93.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.94.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.94.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.95.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.95.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.95.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.95.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.96.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.96.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.97.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.97.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.98.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.98.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.98.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.98.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.99.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.99.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.100.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.100.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.101.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.101.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.102.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.102.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.102.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.102.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.103.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.103.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.104.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.104.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.105.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.105.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.105.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.105.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.106.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.106.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.107.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.107.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.108.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.108.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.109.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.109.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.109.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.109.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.110.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.110.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.111.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.111.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.112.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.112.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.112.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.112.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.113.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.113.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.114.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.114.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.115.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.115.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", 
"model.layers.58.mlp.experts.116.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.116.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.116.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.116.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.117.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.117.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.118.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.118.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.119.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.up_proj.weight": "model-00153-of-000163.safetensors", - 
"model.layers.58.mlp.experts.119.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.119.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.119.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.gate_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.up_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.up_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.120.down_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.120.down_proj.weight_scale_inv": "model-00153-of-000163.safetensors", "model.layers.58.mlp.experts.121.gate_proj.weight": "model-00153-of-000163.safetensors", - "model.layers.58.mlp.experts.121.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.121.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.121.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.121.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.121.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.122.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.122.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.123.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.123.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.123.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.123.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.124.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.124.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.125.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.125.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.126.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.126.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.126.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.126.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.127.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.127.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.128.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.128.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.129.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.129.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.130.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.130.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.130.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.130.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.131.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.131.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.132.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.132.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.133.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.133.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.133.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.133.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.134.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.134.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.135.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.135.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.136.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.136.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.137.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.137.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.137.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.137.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.138.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.138.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.139.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.139.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.140.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.140.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.140.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.140.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.141.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.141.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.142.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.142.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.143.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.143.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.144.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.144.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.144.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.144.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.145.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.145.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.146.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.146.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.147.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.147.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.147.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.147.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.148.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.148.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.149.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.149.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.150.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.150.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.151.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.151.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.151.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.151.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.152.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.152.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.153.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.153.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.154.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.154.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.154.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.154.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.155.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.155.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.156.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.156.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.157.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.157.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.158.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.158.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.158.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.158.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.159.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.159.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.160.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.160.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.161.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.161.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.161.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.161.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.162.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.162.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.163.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.163.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.164.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.164.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.165.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.165.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.165.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.165.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.166.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.166.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.167.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.167.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.168.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.168.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.168.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.168.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.169.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.169.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.170.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.170.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.171.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.171.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.172.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.172.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.172.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.172.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.173.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.173.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.174.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.174.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.175.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.175.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.175.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.175.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.176.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.176.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.177.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.177.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.178.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.178.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.179.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.179.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.179.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.179.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.180.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.180.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.181.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.181.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.182.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.182.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.182.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.182.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.183.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.183.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.184.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.184.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.185.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.185.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.186.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.186.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.186.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.186.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.187.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.187.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.188.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.188.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.189.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.189.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.189.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.189.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.190.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.190.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.191.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.191.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.192.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.192.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.193.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.193.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.193.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.193.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.194.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.194.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.195.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.195.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.196.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.196.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.196.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.196.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.197.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.197.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.198.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.198.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.199.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.199.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.200.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.200.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.200.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.200.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.201.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.201.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.202.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.202.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.203.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.203.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.203.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.203.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.204.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.204.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.205.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.205.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.206.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.206.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.207.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.207.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.207.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.207.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.208.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.208.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.209.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.209.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.210.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.210.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.210.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.210.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.211.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.211.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.212.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.212.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.213.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.213.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", 
"model.layers.58.mlp.experts.214.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.214.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.214.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.214.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.215.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.215.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.216.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.216.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.217.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.up_proj.weight": "model-00154-of-000163.safetensors", - 
"model.layers.58.mlp.experts.217.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.217.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.217.down_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.gate_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.gate_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.up_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.up_proj.weight_scale_inv": "model-00154-of-000163.safetensors", "model.layers.58.mlp.experts.218.down_proj.weight": "model-00154-of-000163.safetensors", - "model.layers.58.mlp.experts.218.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.219.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.219.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.220.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.220.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.mlp.experts.221.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.221.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.221.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.221.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.222.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.222.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.223.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.223.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.224.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.up_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.58.mlp.experts.224.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.224.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.224.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.225.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.225.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.226.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.226.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.227.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.227.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.mlp.experts.228.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.228.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.228.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.228.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.229.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.229.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.230.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.230.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.231.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.up_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.58.mlp.experts.231.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.231.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.231.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.232.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.232.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.233.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.233.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.234.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.234.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.mlp.experts.235.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.235.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.235.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.235.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.236.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.236.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.237.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.237.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.238.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.up_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.58.mlp.experts.238.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.238.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.238.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.239.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.239.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.240.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.240.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.241.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.241.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.mlp.experts.242.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.242.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.242.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.242.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.243.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.243.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.244.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.244.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.245.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.up_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.58.mlp.experts.245.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.245.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.245.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.246.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.246.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.247.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.247.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.248.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.248.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.mlp.experts.249.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.249.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.249.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.249.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.250.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.250.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.251.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.251.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.252.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.up_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.58.mlp.experts.252.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.252.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.252.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.253.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.253.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.254.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.254.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.58.mlp.experts.255.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.58.mlp.experts.255.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.58.input_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.58.post_attention_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_a_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.q_a_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_a_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.q_b_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.q_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_a_proj_with_mqa.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_a_layernorm.weight": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.kv_b_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.kv_b_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.self_attn.o_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.self_attn.o_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.gate.weight": "model-00155-of-000163.safetensors", "model.layers.59.mlp.gate.e_score_correction_bias": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.shared_experts.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.shared_experts.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.0.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.0.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.0.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.0.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.1.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.1.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.2.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.2.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.up_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.3.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.3.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.4.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.4.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.5.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.5.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.6.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.6.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.gate_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.7.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.7.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.7.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.7.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.8.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.8.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.9.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.9.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.10.down_proj.weight": 
"model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.10.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.11.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.11.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.12.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.12.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.13.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.13.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.gate_proj.weight_scale_inv": 
"model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.14.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.14.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.15.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.15.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.16.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.16.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.17.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.17.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.17.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.17.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.18.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.18.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.19.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.19.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.20.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.20.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.21.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.21.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.21.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.21.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.22.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.22.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.23.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.23.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.24.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.24.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.24.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.24.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.25.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.25.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.26.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.26.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.27.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.27.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.28.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.28.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.28.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.28.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.29.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.29.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.30.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.30.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.31.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.31.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.31.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.31.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.32.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.32.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.33.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.33.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.34.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.34.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.35.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.35.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.35.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.35.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.36.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.36.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.37.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.37.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.38.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.38.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.38.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.38.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.39.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.39.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.40.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.40.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.41.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.41.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.42.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.42.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.42.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.42.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.43.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.43.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.44.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.44.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.45.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.45.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.45.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.45.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.46.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.46.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.47.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.47.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.48.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.48.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.49.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", 
"model.layers.59.mlp.experts.49.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.49.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.49.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.50.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.50.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.51.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.51.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.52.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.52.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.52.down_proj.weight": "model-00155-of-000163.safetensors", - 
"model.layers.59.mlp.experts.52.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.53.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.53.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.gate_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.up_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.up_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.54.down_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.54.down_proj.weight_scale_inv": "model-00155-of-000163.safetensors", "model.layers.59.mlp.experts.55.gate_proj.weight": "model-00155-of-000163.safetensors", - "model.layers.59.mlp.experts.55.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.55.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.55.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.55.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.55.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.56.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.56.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.56.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.56.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.57.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.57.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.58.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.58.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.59.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.59.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.59.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.59.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.60.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.60.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.61.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.61.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.62.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.62.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.63.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.63.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.63.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.63.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.64.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.64.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.65.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.65.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.66.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.66.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.66.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.66.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.67.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.67.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.68.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.68.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.69.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.69.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.70.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.70.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.70.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.70.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.71.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.71.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.72.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.72.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.73.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.73.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.73.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.73.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.74.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.74.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.75.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.75.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.76.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.76.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.77.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.77.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.77.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.77.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.78.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.78.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.79.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.79.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.80.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.80.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.80.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.80.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.81.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.81.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.82.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.82.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.83.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.83.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.84.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.84.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.84.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.84.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.85.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.85.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.86.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.86.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.87.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.87.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.87.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.87.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.88.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.88.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.89.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.89.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.90.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.90.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.91.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.91.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.91.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.91.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.92.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.92.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.93.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.93.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.94.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.94.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.94.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.94.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.95.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.95.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.96.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.96.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.97.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.97.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.98.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.98.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.98.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.98.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.99.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.99.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.100.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.100.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.101.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.101.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.101.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.101.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.102.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.102.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.103.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.103.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.104.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.104.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.105.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.105.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.105.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.105.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.106.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.106.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.107.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.107.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.108.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.108.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.108.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.108.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.109.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.109.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.110.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.110.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.111.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.111.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.112.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.112.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.112.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.112.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.113.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.113.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.114.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.114.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.115.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.115.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.115.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.115.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.116.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.116.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.117.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.117.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.118.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.118.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.119.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.119.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.119.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.119.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.120.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.120.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.121.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.121.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.122.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.122.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.122.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.122.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.123.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.123.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.124.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.124.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.125.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.125.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.126.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.126.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.126.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.126.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.127.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.127.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.128.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.128.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.129.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.129.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.129.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.129.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.130.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.130.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.131.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.131.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.132.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.132.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.133.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.133.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.133.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.133.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.134.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.134.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.135.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.135.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.136.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.136.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.136.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.136.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.137.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.137.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.138.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.138.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.139.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.139.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.140.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.140.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.140.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.140.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.141.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.141.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.142.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.142.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.143.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.143.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.143.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.143.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.144.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.144.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.145.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.145.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.146.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.146.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.147.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", 
"model.layers.59.mlp.experts.147.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.147.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.147.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.148.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.148.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.149.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.149.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.150.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.150.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.150.down_proj.weight": "model-00156-of-000163.safetensors", - 
"model.layers.59.mlp.experts.150.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.151.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.151.down_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.gate_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.gate_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.up_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.up_proj.weight_scale_inv": "model-00156-of-000163.safetensors", "model.layers.59.mlp.experts.152.down_proj.weight": "model-00156-of-000163.safetensors", - "model.layers.59.mlp.experts.152.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.153.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.153.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.154.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.154.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.154.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.154.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.155.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.155.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.156.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.156.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.157.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.157.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.157.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.157.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.158.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.158.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.159.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.159.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.160.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.160.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.161.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.161.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.161.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.161.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.162.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.162.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.163.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.163.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.164.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.164.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.164.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.164.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.165.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.165.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.166.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.166.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.167.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.167.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.168.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.168.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.168.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.168.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.169.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.169.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.170.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.170.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.171.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.171.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.171.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.171.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.172.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.172.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.173.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.173.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.174.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.174.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.175.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.175.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.175.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.175.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.176.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.176.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.177.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.177.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.178.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.178.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.178.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.178.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.179.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.179.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.180.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.180.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.181.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.181.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.182.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.182.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.182.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.182.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.183.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.183.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.184.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.184.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.185.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.185.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.185.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.185.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.186.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.186.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.187.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.187.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.188.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.188.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.189.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.189.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.189.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.189.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.190.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.190.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.191.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.191.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.192.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.192.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.192.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.192.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.193.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.193.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.194.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.194.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.195.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.195.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.196.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.196.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.196.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.196.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.197.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.197.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.198.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.198.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.199.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.199.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.199.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.199.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.200.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.200.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.201.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.201.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.202.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.202.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.203.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.203.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.203.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.203.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.204.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.204.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.205.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.205.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.206.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.206.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.206.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.206.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.207.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.207.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.208.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.208.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.209.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.209.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.210.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.210.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.210.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.210.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.211.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.211.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.212.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.212.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.213.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.213.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.213.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.213.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.214.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.214.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.215.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.215.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.216.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.216.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.217.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.217.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.217.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.217.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.218.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.218.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.219.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.219.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.220.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.220.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.220.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.220.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.221.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.221.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.222.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.222.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.223.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.223.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.224.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.224.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.224.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.224.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.225.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.225.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.226.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.226.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.227.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.227.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.227.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.227.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.228.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.228.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.229.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.229.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.230.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.230.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.231.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.231.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.231.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.231.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.232.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.232.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.233.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.233.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.234.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.234.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.234.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.234.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.235.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.235.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.236.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.236.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.237.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.237.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.238.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.238.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.238.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.238.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.239.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.239.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.240.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.240.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.241.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.241.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.241.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.241.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.242.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.242.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.243.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.243.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.244.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.244.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.245.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", 
"model.layers.59.mlp.experts.245.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.245.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.245.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.246.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.246.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.247.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.247.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.248.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.248.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.248.down_proj.weight": "model-00157-of-000163.safetensors", - 
"model.layers.59.mlp.experts.248.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.up_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.249.down_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.249.down_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.250.gate_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.250.gate_proj.weight_scale_inv": "model-00157-of-000163.safetensors", "model.layers.59.mlp.experts.250.up_proj.weight": "model-00157-of-000163.safetensors", - "model.layers.59.mlp.experts.250.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.250.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.250.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.251.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.251.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.252.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.59.mlp.experts.252.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.252.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.252.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.253.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.253.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.254.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.254.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.255.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.59.mlp.experts.255.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.mlp.experts.255.down_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.59.mlp.experts.255.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.59.input_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.59.post_attention_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_a_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.q_a_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_a_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.q_b_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.q_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_a_proj_with_mqa.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_a_layernorm.weight": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.kv_b_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.kv_b_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.self_attn.o_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.self_attn.o_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.gate.weight": "model-00158-of-000163.safetensors", "model.layers.60.mlp.gate.e_score_correction_bias": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.shared_experts.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.shared_experts.down_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.shared_experts.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.0.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.0.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.1.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.1.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.2.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.2.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.up_proj.weight": 
"model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.3.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.3.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.4.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.4.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.5.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.5.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.6.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.6.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.7.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.7.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.7.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.7.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.8.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.8.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.9.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.9.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.up_proj.weight_scale_inv": 
"model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.10.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.10.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.11.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.11.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.12.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.12.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.13.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.13.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.14.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.14.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.14.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.14.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.15.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.15.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.16.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.16.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.17.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.17.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.17.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.17.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.18.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.18.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.19.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.19.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.20.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.20.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.21.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.21.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.21.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.21.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.22.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.22.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.23.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.23.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.24.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.24.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.24.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.24.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.25.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.25.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.26.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.26.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.27.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.27.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.28.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.28.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.28.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.28.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.29.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.29.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.30.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.30.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.31.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.31.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.31.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.31.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.32.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.32.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.33.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.33.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.34.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.34.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.35.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.35.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.35.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.35.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.36.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.36.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.37.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.37.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.38.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.38.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.38.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.38.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.39.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.39.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.40.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.40.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.41.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.41.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.42.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.42.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.42.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.42.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.43.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.43.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.44.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.44.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.45.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.45.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.45.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.45.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.46.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.46.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.47.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.47.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.48.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.48.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.49.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.49.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.49.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.49.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.50.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.50.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.51.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.51.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.52.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.52.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.52.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.52.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.53.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.53.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.54.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.54.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.55.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.55.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.56.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.56.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.56.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.56.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.57.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.57.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.58.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.58.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.59.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.59.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.59.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.59.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.60.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.60.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.61.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.61.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.62.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.62.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.63.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.63.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.63.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.63.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.64.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.64.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.65.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.65.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.66.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.66.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.66.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.66.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.67.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.67.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.68.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.68.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.69.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.69.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.70.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.70.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.70.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.70.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.71.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.71.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.72.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.72.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.73.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.73.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.73.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.73.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.74.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.74.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.75.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.75.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.76.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.76.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.77.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.77.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.77.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.77.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.78.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.78.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.79.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.79.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.80.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.80.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", 
"model.layers.60.mlp.experts.80.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.80.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.81.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.81.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.82.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.82.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.83.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.83.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.gate_proj.weight": "model-00158-of-000163.safetensors", - 
"model.layers.60.mlp.experts.84.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.84.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.84.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.84.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.85.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.85.down_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.gate_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.gate_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.up_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.up_proj.weight_scale_inv": "model-00158-of-000163.safetensors", "model.layers.60.mlp.experts.86.down_proj.weight": "model-00158-of-000163.safetensors", - "model.layers.60.mlp.experts.86.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.87.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.87.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.87.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.87.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.88.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.88.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.89.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.89.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.90.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.90.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.91.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.91.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.91.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.91.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.92.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.92.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.93.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.93.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.94.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.94.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.94.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.94.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.95.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.95.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.96.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.96.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.97.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.97.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.98.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.98.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.98.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.98.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.99.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.99.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.100.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.100.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.101.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.101.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.101.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.101.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.102.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.102.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.103.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.103.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.104.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.104.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.105.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.105.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.105.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.105.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.106.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.106.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.107.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.107.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.108.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.108.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.108.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.108.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.109.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.109.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.110.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.110.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.111.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.111.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.112.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.112.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.112.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.112.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.113.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.113.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.114.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.114.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.115.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.115.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.115.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.115.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.116.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.116.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.117.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.117.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.118.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.118.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.119.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.119.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.119.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.119.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.120.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.120.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.121.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.121.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.122.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.122.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.122.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.122.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.123.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.123.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.124.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.124.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.125.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.125.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.126.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.126.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.126.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.126.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.127.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.127.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.128.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.128.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.129.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.129.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.129.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.129.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.130.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.130.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.131.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.131.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.132.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.132.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.133.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.133.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.133.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.133.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.134.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.134.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.135.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.135.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.136.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.136.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.136.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.136.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.137.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.137.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.138.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.138.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.139.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.139.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.140.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.140.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.140.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.140.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.141.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.141.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.142.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.142.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.143.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.143.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.143.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.143.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.144.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.144.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.145.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.145.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.146.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.146.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.147.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.147.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.147.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.147.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.148.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.148.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.149.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.149.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.150.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.150.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.150.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.150.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.151.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.151.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.152.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.152.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.153.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.153.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.154.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.154.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.154.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.154.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.155.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.155.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.156.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.156.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.157.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.157.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.157.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.157.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.158.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.158.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.159.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.159.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.160.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.160.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.161.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.161.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.161.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.161.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.162.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.162.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.163.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.163.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.164.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.164.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.164.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.164.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.165.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.165.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.166.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.166.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.167.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.167.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.168.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.168.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.168.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.168.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.169.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.169.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.170.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.170.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.171.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.171.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.171.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.171.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.172.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.172.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.173.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.173.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.174.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.174.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.175.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.175.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.175.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.175.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.176.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.176.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.177.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.177.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.178.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.178.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", 
"model.layers.60.mlp.experts.178.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.178.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.179.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.179.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.180.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.180.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.181.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.181.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.gate_proj.weight": "model-00159-of-000163.safetensors", - 
"model.layers.60.mlp.experts.182.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.182.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.182.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.182.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.up_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.183.down_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.183.down_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.184.gate_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.184.gate_proj.weight_scale_inv": "model-00159-of-000163.safetensors", "model.layers.60.mlp.experts.184.up_proj.weight": "model-00159-of-000163.safetensors", - "model.layers.60.mlp.experts.184.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.184.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.184.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.185.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.185.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.185.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.185.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.186.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.186.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.187.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.187.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.188.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.188.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.189.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.189.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.189.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.189.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.190.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.190.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.191.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.191.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.192.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.192.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.192.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.192.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.193.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.193.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.194.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.194.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.195.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.195.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.196.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.196.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.196.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.196.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.197.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.197.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.198.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.198.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.199.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.199.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.199.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.199.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.200.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.200.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.201.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.201.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.202.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.202.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.203.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.203.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.203.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.203.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.204.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.204.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.205.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.205.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.206.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.206.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.206.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.206.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.207.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.207.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.208.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.208.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.209.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.209.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.210.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.210.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.210.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.210.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.211.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.211.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.212.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.212.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.213.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.213.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.213.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.213.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.214.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.214.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.215.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.215.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.216.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.216.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.217.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.217.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.217.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.217.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.218.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.218.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.219.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.219.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.220.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.220.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.220.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.220.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.221.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.221.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.222.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.222.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.223.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.223.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.224.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.224.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.224.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.224.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.225.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.225.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.226.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.226.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.227.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.227.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.227.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.227.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.228.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.228.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.229.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.229.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.230.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.230.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.231.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.231.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.231.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.231.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.232.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.232.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.233.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.233.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.234.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.234.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.234.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.234.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.235.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.235.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.236.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.236.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.237.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.237.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.238.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.238.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.238.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.238.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.239.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.239.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.240.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.240.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.241.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.241.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.241.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.241.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.242.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.242.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.243.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.243.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.244.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.244.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.245.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.245.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.245.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.245.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.246.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.246.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.247.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.247.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.248.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.248.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.248.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.248.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.249.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.249.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.250.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.250.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.251.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.251.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.gate_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.60.mlp.experts.252.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.252.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.252.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.252.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.253.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.253.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.254.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.254.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.255.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.mlp.experts.255.up_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", 
"model.layers.60.mlp.experts.255.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.60.mlp.experts.255.down_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.60.input_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.60.post_attention_layernorm.weight": "model-00160-of-000163.safetensors", "model.norm.weight": "model-00160-of-000163.safetensors", "lm_head.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_a_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.q_a_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_a_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.q_b_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.q_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_a_proj_with_mqa.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.kv_a_proj_with_mqa.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_a_layernorm.weight": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.kv_b_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.kv_b_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.self_attn.o_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.self_attn.o_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.gate.weight": "model-00160-of-000163.safetensors", "model.layers.61.mlp.gate.e_score_correction_bias": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.gate_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.mlp.shared_experts.gate_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.up_proj.weight": "model-00160-of-000163.safetensors", - 
"model.layers.61.mlp.shared_experts.up_proj.weight_scale_inv": "model-00160-of-000163.safetensors", "model.layers.61.mlp.shared_experts.down_proj.weight": "model-00160-of-000163.safetensors", - "model.layers.61.mlp.shared_experts.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.0.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.0.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.1.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.1.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.2.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.2.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.3.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.3.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.3.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.3.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.4.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.4.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.5.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.5.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.up_proj.weight_scale_inv": 
"model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.6.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.6.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.7.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.7.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.8.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.8.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.9.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.9.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.10.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.10.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.10.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.10.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.11.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.11.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.12.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.12.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.13.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.13.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.13.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.13.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.14.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.14.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.15.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.15.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.16.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.16.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.17.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.17.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.17.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.17.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.18.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.18.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.19.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.19.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.20.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.20.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.20.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.20.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.21.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.21.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.22.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.22.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.23.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.23.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.24.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.24.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.24.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.24.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.25.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.25.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.26.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.26.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.27.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.27.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.27.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.27.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.28.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.28.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.29.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.29.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.30.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.30.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.31.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.31.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.31.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.31.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.32.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.32.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.33.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.33.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.34.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.34.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.34.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.34.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.35.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.35.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.36.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.36.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.37.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.37.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.38.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.38.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.38.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.38.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.39.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.39.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.40.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.40.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.41.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.41.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.41.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.41.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.42.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.42.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.43.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.43.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.44.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.44.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.45.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.45.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.45.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.45.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.46.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.46.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.47.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.47.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.48.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.48.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.48.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.48.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.49.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.49.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.50.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.50.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.51.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.51.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.52.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.52.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.52.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.52.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.53.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.53.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.54.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.54.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.55.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.55.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.55.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.55.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.56.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.56.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.57.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.57.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.58.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.58.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.59.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.59.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.59.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.59.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.60.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.60.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.61.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.61.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.62.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.62.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.62.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.62.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.63.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.63.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.64.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.64.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.65.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.65.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.66.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.66.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.66.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.66.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.67.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.67.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.68.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.68.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.69.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.69.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.69.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.69.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.70.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.70.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.71.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.71.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.72.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.72.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.73.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.73.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.73.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.73.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.74.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.74.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.75.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.75.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.76.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.76.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.76.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.76.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.77.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.77.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.78.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.78.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.79.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.79.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.80.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.80.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.80.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.80.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.81.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.81.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.82.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.82.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.83.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.83.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.83.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.83.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.84.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.84.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.85.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.85.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.86.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.86.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.87.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.87.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.87.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.87.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.88.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.88.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.89.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.89.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.90.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.90.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", 
"model.layers.61.mlp.experts.90.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.90.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.91.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.91.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.92.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.92.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.93.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.93.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.gate_proj.weight": "model-00161-of-000163.safetensors", - 
"model.layers.61.mlp.experts.94.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.94.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.94.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.94.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.95.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.95.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.up_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.96.down_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.96.down_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.97.gate_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.97.gate_proj.weight_scale_inv": "model-00161-of-000163.safetensors", "model.layers.61.mlp.experts.97.up_proj.weight": "model-00161-of-000163.safetensors", - "model.layers.61.mlp.experts.97.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.97.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.97.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.98.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.98.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.99.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.99.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.100.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.100.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.101.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.101.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.101.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.101.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.102.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.102.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.103.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.103.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.104.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.104.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.104.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.104.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.105.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.105.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.106.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.106.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.107.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.107.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.108.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.108.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.108.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.108.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.109.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.109.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.110.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.110.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.111.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.111.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.111.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.111.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.112.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.112.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.113.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.113.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.114.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.114.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.115.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.115.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.115.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.115.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.116.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.116.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.117.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.117.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.118.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.118.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.118.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.118.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.119.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.119.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.120.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.120.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.121.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.121.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.122.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.122.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.122.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.122.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.123.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.123.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.124.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.124.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.125.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.125.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.125.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.125.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.126.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.126.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.127.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.127.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.128.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.128.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.129.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.129.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.129.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.129.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.130.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.130.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.131.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.131.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.132.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.132.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.132.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.132.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.133.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.133.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.134.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.134.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.135.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.135.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.136.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.136.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.136.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.136.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.137.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.137.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.138.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.138.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.139.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.139.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.139.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.139.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.140.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.140.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.141.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.141.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.142.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.142.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.143.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.143.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.143.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.143.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.144.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.144.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.145.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.145.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.146.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.146.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.146.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.146.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.147.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.147.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.148.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.148.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.149.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.149.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.150.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.150.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.150.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.150.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.151.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.151.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.152.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.152.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.153.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.153.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.153.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.153.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.154.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.154.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.155.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.155.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.156.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.156.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.157.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.157.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.157.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.157.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.158.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.158.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.159.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.159.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.160.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.160.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.160.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.160.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.161.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.161.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.162.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.162.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.163.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.163.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.164.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.164.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.164.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.164.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.165.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.165.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.166.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.166.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.167.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.167.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.167.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.167.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.168.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.168.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.169.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.169.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.170.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.170.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.171.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.171.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.171.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.171.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.172.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.172.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.173.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.173.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.174.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.174.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.174.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.174.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.175.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.175.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.176.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.176.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.177.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.177.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.178.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.178.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.178.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.178.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.179.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.179.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.180.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.180.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.181.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.181.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.181.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.181.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.182.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.182.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.183.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.183.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.184.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.184.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.185.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.185.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.185.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.185.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.186.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.186.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.187.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.187.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.188.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.188.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", 
"model.layers.61.mlp.experts.188.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.188.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.189.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.189.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.190.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.190.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.191.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.191.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.gate_proj.weight": "model-00162-of-000163.safetensors", - 
"model.layers.61.mlp.experts.192.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.192.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.192.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.192.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.193.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.193.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.gate_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.up_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.up_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.194.down_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.194.down_proj.weight_scale_inv": "model-00162-of-000163.safetensors", "model.layers.61.mlp.experts.195.gate_proj.weight": "model-00162-of-000163.safetensors", - "model.layers.61.mlp.experts.195.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.195.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.195.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.195.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.195.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.196.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.196.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.197.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.197.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.198.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.198.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.199.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.199.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.199.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.199.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.200.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.200.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.201.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.201.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.202.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.202.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.202.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.202.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.203.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.203.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.204.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.204.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.205.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.205.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.206.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.206.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.206.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.206.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.207.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.207.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.208.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.208.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.209.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.209.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.209.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.209.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.210.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.210.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.211.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.211.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.212.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.212.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.213.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.213.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.213.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.213.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.214.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.214.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.215.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.215.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.216.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.216.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.216.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.216.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.217.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.217.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.218.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.218.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.219.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.219.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.220.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.220.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.220.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.220.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.221.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.221.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.222.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.222.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.223.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.223.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.223.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.223.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.224.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.224.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.225.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.225.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.226.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.226.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.227.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.227.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.227.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.227.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.228.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.228.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.229.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.229.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.230.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.230.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.230.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.230.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.231.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.231.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.232.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.232.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.233.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.233.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.234.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.234.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.234.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.234.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.235.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.235.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.236.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.236.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.237.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.237.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.237.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.237.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.238.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.238.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.239.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.239.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.240.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.240.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.241.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.241.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.241.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.241.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.242.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.242.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.243.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.243.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.244.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.244.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.244.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.244.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.245.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.245.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.246.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.246.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.247.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.247.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.248.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.248.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.248.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.248.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.249.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.249.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.250.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.250.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.251.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.251.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", 
"model.layers.61.mlp.experts.251.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.251.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.252.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.252.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.253.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.253.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.gate_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.254.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.254.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.gate_proj.weight": "model-00163-of-000163.safetensors", - 
"model.layers.61.mlp.experts.255.gate_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.up_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.255.up_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.mlp.experts.255.down_proj.weight": "model-00163-of-000163.safetensors", - "model.layers.61.mlp.experts.255.down_proj.weight_scale_inv": "model-00163-of-000163.safetensors", "model.layers.61.input_layernorm.weight": "model-00163-of-000163.safetensors", "model.layers.61.post_attention_layernorm.weight": "model-00163-of-000163.safetensors", "model.layers.61.embed_tokens.weight": "model-00163-of-000163.safetensors",